import os
import sys
with open(sys.argv[0]) as f:
    code = f.read() # read the code of this file ASAP, for logging
import uuid
import time
import copy
from dataclasses import dataclass
from functools import lru_cache
from pathlib import Path

# must be set before torch is imported
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True"
import torch
torch.empty(1, device="cuda", requires_grad=True).backward() # prevents a bug on some systems
from torch import Tensor, nn
import torch.nn.functional as F
import torch.distributed as dist
# use of FlexAttention contributed by @KoszarskyB
from torch.nn.attention.flex_attention import BlockMask, flex_attention
torch._inductor.config.coordinate_descent_tuning = True # we have banned this flag for new records because it causes compilation to take 30min

# -----------------------------------------------------------------------------
# Custom operators: FP8 matmul by @YouJiacheng

@torch.library.custom_op("nanogpt::mm", mutates_args=())
def mm_op(x: Tensor, w: Tensor, x_s: float, w_s: float, grad_s: float) -> tuple[Tensor, Tensor, Tensor]:
    """Forward FP8 matmul registered as the custom op ``nanogpt::mm``.

    ``x`` and ``w`` are divided by their scales ``x_s`` / ``w_s``, cast to
    float8_e4m3fn and multiplied as ``x @ w.T`` through ``torch._scaled_mm``
    (bfloat16 output, the same scales passed back as ``scale_a`` / ``scale_b``).
    ``grad_s`` is not used in the forward computation; ``setup_context`` stores
    it for the backward op.

    Returns ``(out, x_f8, w_f8)``; the two FP8 tensors are the ones saved for
    the backward pass by ``setup_context``.
    """
    @torch.compile
    def impl(x: Tensor, w: Tensor):
        assert x.is_contiguous() and w.is_contiguous()
        x_f8 = x.div(x_s).to(torch.float8_e4m3fn)
        w_f8 = w.div(w_s).to(torch.float8_e4m3fn)
        out = torch._scaled_mm(
            x_f8,
            w_f8.T,
            out_dtype=torch.bfloat16,
            scale_a=x.new_tensor(x_s, dtype=torch.float32),
            scale_b=x.new_tensor(w_s, dtype=torch.float32),
            use_fast_accum=True,
        )
        return out, x_f8, w_f8

    return impl(x, w)

@mm_op.register_fake
def _(x: Tensor, w: Tensor, *_):
    # Fake (shape/dtype-only) implementation of nanogpt::mm: checks that both
    # operands are contiguous 2D tensors on the same device with matching inner
    # dimension, and returns stand-ins for (out, x_f8, w_f8).
    assert x.ndim == w.ndim == 2
    assert x.shape[1] == w.shape[1]
    assert x.device == w.device
    assert x.is_contiguous() and w.is_contiguous()
    return x @ w.T, x.to(torch.float8_e4m3fn), w.to(torch.float8_e4m3fn)

@torch.library.custom_op("nanogpt::mm_backward", mutates_args=())
def mm_backward_op(g: Tensor, x_f8: Tensor, w_f8: Tensor, x_s: float, w_s: float, grad_s: float) -> tuple[Tensor, Tensor]:
    """Backward FP8 matmul registered as the custom op ``nanogpt::mm_backward``.

    The incoming gradient ``g`` is divided by ``grad_s`` and cast to
    float8_e5m2; both products go through ``torch._scaled_mm`` with
    ``use_fast_accum=False``.

    Returns ``(grad_x, grad_w)``: ``grad_x`` in bfloat16 and ``grad_w`` in
    float32 (the latter is produced transposed and returned via ``.T``).
    """
    @torch.compile
    def impl(grad: Tensor, x_f8: Tensor, w_f8: Tensor):
        assert grad.is_contiguous()
        # NOTE: despite the "_inv_" in the names, these tensors hold the scales themselves
        x_inv_s = grad.new_tensor(x_s, dtype=torch.float32)
        w_inv_s = grad.new_tensor(w_s, dtype=torch.float32)
        grad_inv_s = grad.new_tensor(grad_s, dtype=torch.float32)
        grad_f8 = grad.div(grad_s).to(torch.float8_e5m2)
        grad_x = torch._scaled_mm(
            grad_f8,
            w_f8.T.contiguous().T,
            out_dtype=torch.bfloat16,
            scale_a=grad_inv_s,
            scale_b=w_inv_s,
            use_fast_accum=False,
        )
        # faster than grad_f8_t @ x_f8, for (d_out, d_in) == (50304, 768)
        grad_w = torch._scaled_mm(
            x_f8.T.contiguous(),
            grad_f8.T.contiguous().T,
            out_dtype=torch.float32,
            scale_a=x_inv_s,
            scale_b=grad_inv_s,
            use_fast_accum=False,
        ).T
        return grad_x, grad_w

    return impl(g, x_f8, w_f8)

@mm_backward_op.register_fake
def _(g: Tensor, x_f8: Tensor, w_f8: Tensor, *_):
    # Fake implementation of nanogpt::mm_backward: stand-ins for (grad_x, grad_w)
    # built from the saved FP8 operands.
    return x_f8.to(torch.bfloat16), w_f8.T.contiguous().T.to(torch.float32)

def backward(ctx, grad_out: Tensor, *_):
    # Autograd backward for mm_op: only the gradient of the first output is used;
    # gradients for the two FP8 outputs are swallowed by *_.
    x_f8, w_f8 = ctx.saved_tensors
    x_s, w_s, grad_s = ctx.scales
    grad_x, grad_w = torch.ops.nanogpt.mm_backward(
        grad_out, x_f8, w_f8, x_s, w_s, grad_s
    )
    # one entry per mm_op input: x, w, then None for the three float scales
    return grad_x, grad_w, None, None, None

def setup_context(ctx: torch.autograd.function.FunctionCtx, inputs, output):
    # Stash what backward() needs: the FP8 operands produced by the forward op
    # and the three scale factors taken from the op inputs.
    *_, x_s, w_s, grad_s = inputs
    _, x_f8, w_f8 = output
    ctx.save_for_backward(x_f8, w_f8)
    ctx.scales = x_s, w_s, grad_s
    ctx.set_materialize_grads(False)

mm_op.register_autograd(backward, setup_context=setup_context)

# -----------------------------------------------------------------------------
# Muon optimizer

@torch.compile
def zeropower_via_newtonschulz5(G: Tensor, steps: int) -> Tensor:
    """
    Newton-Schulz iteration to compute the zeroth power / orthogonalization of G. We opt to use a
    quintic iteration whose coefficients are selected to maximize the slope at zero. For the purpose
    of minimizing steps, it turns out to be empirically effective to keep increasing the slope at
    zero even beyond the point where the iteration no longer converges all the way to one everywhere
    on the interval. This iteration therefore does not produce UV^T but rather something like US'V^T
    where S' is diagonal with S_{ii}' ~ Uniform(0.5, 1.5), which turns out not to hurt model
    performance at all relative to UV^T, where USV^T = G is the SVD.

    NOTE: `steps` is accepted but never read; the loop below always runs the five
    hard-coded (a, b, c) coefficient triples. The computation is done in bfloat16,
    and the result is returned in bfloat16 with the same orientation as G.
    """
    assert G.ndim >= 2 # batched Muon implementation by @scottjmaddox, and put into practice in the record by @YouJiacheng
    X = G.bfloat16()
    # work on the wide orientation so that X @ X.mT is the smaller Gram matrix
    if G.size(-2) > G.size(-1):
        X = X.mT

    # Ensure spectral norm is at most 1
    X = X / (X.norm(dim=(-2, -1), keepdim=True) + 1e-7)
    # Perform the NS iterations
    for a, b, c in [
        (4.0848, -6.8946, 2.9270),
        (3.9505, -6.3029, 2.6377),
        (3.7418, -5.5913, 2.3037),
        (2.8769, -3.1427, 1.2046),
        (2.8366, -3.0525, 1.2012),
    ]:
        A = X @ X.mT
        B = b * A + c * A @ A # quintic computation strategy adapted from suggestion by @jxbz, @leloykun, and @YouJiacheng
        X = a * X + B @ X

    # undo the transpose applied above
    if G.size(-2) > G.size(-1):
        X = X.mT
    return X

class Muon(torch.optim.Optimizer):
    """
    Muon - MomentUm Orthogonalized by Newton-schulz

    https://kellerjordan.github.io/posts/muon/

    Muon internally runs standard SGD-momentum, and then performs an orthogonalization post-
    processing step, in which each 2D parameter's update is replaced with the nearest orthogonal
    matrix. To efficiently orthogonalize each update, we use a Newton-Schulz iteration, which has
    the advantage that it can be stably run in bfloat16 on the GPU.

    Some warnings:
    - This optimizer should not be used for the embedding layer, the final fully connected layer,
    or any {0,1}-D parameters; those should all be optimized by a standard method (e.g., AdamW).
    - To use it with 4D convolutional filters, it works well to just flatten their last 3 dimensions.

    Arguments:
        lr: The learning rate used by the internal SGD.
        weight_decay: Decay coefficient; each step multiplies a parameter by
            (1 - lr * weight_decay * wd_mul), where wd_mul is an optional per-parameter
            attribute defaulting to 1.0.
        momentum: The momentum used by the internal SGD.
        nesterov: Whether to use Nesterov-style momentum in the internal SGD. (recommended)
        ns_steps: The number of Newton-Schulz iteration steps to use. (Passed through to
            zeropower_via_newtonschulz5, which currently ignores it.)
        rank: Index of this process; selects which parameter of each chunk this process updates.
        world_size: Number of processes; parameters are handled in chunks of this size.
    """
    def __init__(self, params, lr=0.02, weight_decay=0.01, momentum=0.95, nesterov=True, ns_steps=5, rank=0, world_size=1):
        self.rank = rank
        self.world_size = world_size
        defaults = dict(lr=lr, weight_decay=weight_decay, momentum=momentum, nesterov=nesterov, ns_steps=ns_steps)
        params: list[Tensor] = [*params]
        param_groups = []
        # one param group per distinct element count, so every parameter in a group
        # fits a row of the shared (world_size, size) bfloat16 gather buffer
        for size in {p.numel() for p in params}:
            b = torch.empty(world_size, size, dtype=torch.bfloat16, device="cuda")
            group = dict(params=[p for p in params if p.numel() == size],
                         update_buffer=b, update_buffer_views=[b[i] for i in range(world_size)])
            param_groups.append(group)
        super().__init__(param_groups, defaults)

    @torch.no_grad()
    def step(self):
        # For each group, parameters are processed in chunks of world_size: this rank
        # orthogonalizes the update of params[base_i + rank], the flattened updates are
        # all-gathered asynchronously, and the previous chunk is applied while the next
        # gather is in flight.
        for group in self.param_groups:
            update_buffer: Tensor = group["update_buffer"]
            update_buffer_views: list[Tensor] = group["update_buffer_views"]
            # generate weight updates in distributed fashion
            params: list[Tensor] = group["params"]
            handle = None
            params_world = None
            def update_prev(): # optimized Muon implementation contributed by @YouJiacheng
                # wait for the pending gather, then apply weight decay and the gathered
                # update to each parameter of the previous chunk (zip stops at the
                # shorter sequence, so a partial last chunk is handled)
                handle.wait()
                for p_world, g_world in zip(params_world, update_buffer_views):
                    p_world.mul_(1 - group["lr"] * group["weight_decay"] * getattr(p_world, "wd_mul", 1.0))
                    p_world.add_(g_world.view_as(p_world),
                                 alpha=-group["lr"] * max(1, p_world.size(-2) / p_world.size(-1))**0.5)
            for base_i in range(len(params))[::self.world_size]:
                if base_i + self.rank < len(params):
                    p = params[base_i + self.rank]
                    g = p.grad
                    assert g is not None
                    state = self.state[p]
                    if "momentum_buffer" not in state:
                        state["momentum_buffer"] = torch.zeros_like(g)
                    buf: Tensor = state["momentum_buffer"]
                    buf.lerp_(g, 1 - group["momentum"])
                    # note: the Nesterov branch modifies p.grad in place
                    g = g.lerp_(buf, group["momentum"]) if group["nesterov"] else buf
                    g = zeropower_via_newtonschulz5(g, steps=group["ns_steps"]).flatten()
                else:
                    # no parameter for this rank in the last chunk: contribute this
                    # rank's buffer row so the collective still has an input
                    g = update_buffer_views[self.rank]
                if base_i > 0:
                    update_prev() # async all_gather instead of sync all_reduce by @YouJiacheng
                handle = dist.all_gather_into_tensor(update_buffer, g, async_op=True)
                params_world = params[base_i : base_i + self.world_size]
            # apply the final chunk of this group
            update_prev()

# -----------------------------------------------------------------------------
# PyTorch nn.Module definitions for the model

def norm(x: Tensor):
    """RMS-normalize `x` over its last dimension (no learnable weight is passed)."""
    return F.rms_norm(x, (x.size(-1),))

class CastedLinear(nn.Linear):
    """Bias-free linear layer that casts its weight to the input dtype, with an optional FP8 training path."""

    def __init__(self, in_features: int, out_features: int, use_fp8: bool = False, x_s: float = 1.0, w_s: float = 1.0, grad_s: float = 1.0):
        super().__init__(in_features, out_features, bias=False)
        self.use_fp8 = use_fp8
        # scale factors forwarded to the nanogpt::mm custom op when use_fp8 is set
        self.x_s = x_s
        self.w_s = w_s
        self.grad_s = grad_s

    def reset_parameters(self) -> None:
        # uniform init on [-bound, bound], i.e. standard deviation `std`
        std = 0.5 * (self.in_features ** -0.5) # 0.5 is a bit better than the default 1/sqrt(3)
        bound = (3 ** 0.5) * std
        with torch.no_grad():
            self.weight.uniform_(-bound, bound)

    def forward(self, x: Tensor):
        if self.use_fp8 and self.training:
            # the custom op takes 2D operands: flatten leading dims, restore them afterwards
            _x = x.flatten(0, -2)
            out: Tensor = torch.ops.nanogpt.mm(_x, self.weight, x_s=self.x_s, w_s=self.w_s, grad_s=self.grad_s)[0]
            return out.reshape(*x.shape[:-1], -1)
        else:
            return F.linear(x, self.weight.type_as(x))

class Rotary(nn.Module):
    """Rotary position embedding with precomputed, non-persistent cos/sin tables."""

    def __init__(self, dim: int, max_seq_len: int):
        super().__init__()
        # half-truncate RoPE by @YouJiacheng (w/ base freq tuning)
        # dim//4 geometric frequencies followed by dim//4 zeros -> dim//2 columns,
        # so the second half of the rotated pairs is left unrotated
        angular_freq = (1 / 1024) ** torch.linspace(0, 1, steps=dim//4, dtype=torch.float32)
        angular_freq = torch.cat([angular_freq, angular_freq.new_zeros(dim//4)])
        t = torch.arange(max_seq_len, dtype=torch.float32)
        theta = torch.einsum("i,j -> ij", t, angular_freq)
        self.cos = nn.Buffer(theta.cos(), persistent=False)
        self.sin = nn.Buffer(theta.sin(), persistent=False)

    def forward(self, x_BTHD: Tensor):
        # the sequence axis is dim -3; the tables must cover it
        assert self.cos.size(0) >= x_BTHD.size(-3)
        cos, sin = self.cos[None, :x_BTHD.size(-3), None, :], self.sin[None, :x_BTHD.size(-3), None, :]
        # rotate in float32, pairing the first and second halves of the last dim
        x1, x2 = x_BTHD.to(dtype=torch.float32).chunk(2, dim=-1)
        y1 = x1 * cos + x2 * sin
        y2 = x1 * (-sin) + x2 * cos
        return torch.cat((y1, y2), 3).type_as(x_BTHD)

class CausalSelfAttention(nn.Module):
    """Self-attention with merged QKV weights, QK-norm, rotary embeddings and FlexAttention."""

    def __init__(self, dim: int, num_heads: int, max_seq_len: int, head_dim=128):
        super().__init__()
        self.num_heads = num_heads
        self.head_dim = head_dim
        hdim = num_heads * head_dim
        std = 0.5 * (dim ** -0.5)
        bound = (3 ** 0.5) * std # improved init scale by @YouJiacheng
        # merged QKV weights: suggested by many, implemented by @fernbear.bsky.social, and further improved by @YouJiacheng
        # https://x.com/hi_tysam/status/1879699187107033311
        self.qkv_w = nn.Parameter(torch.empty(3, hdim, dim).uniform_(-bound, bound))
        # mixing weights for (own values, token value embedding), see forward()
        self.lambdas = nn.Parameter(torch.tensor([0.5, 0.5]))
        self.rotary = Rotary(head_dim, max_seq_len)
        self.c_proj = CastedLinear(hdim, dim)
        self.c_proj.weight.detach().zero_() # zero init suggested by @Grad62304977
        # scale the attention logits by given constant, instead of the default head_dim**-0.5, by @leloykun
        # inspired by learnable scalars used by @brendanh0gan https://x.com/hi_tysam/status/1879693583898591283
        self.attn_scale = 0.12

    def forward(self, x: Tensor, ve: Tensor | None, block_mask: BlockMask):
        B, T = x.size(0), x.size(1) # batch size, sequence length
        assert B == 1, "Must use batch size = 1 for FlexAttention"
        # single projection with the stacked (3*hdim, dim) weight, then split into q, k, v
        q, k, v = F.linear(x, self.qkv_w.flatten(end_dim=1).type_as(x)).view(B, T, 3 * self.num_heads, self.head_dim).chunk(3, dim=-2)
        q, k = norm(q), norm(k) # QK norm @Grad62304977
        q, k = self.rotary(q), self.rotary(k)
        v = norm(v)
        if ve is not None:
            v = self.lambdas[0] * v + self.lambdas[1] * ve.view_as(v) # @KoszarskyB & @Grad62304977
        else: # skip mid-layers token value embeddings by @YouJiacheng
            v = self.lambdas[0] * v
        # flex_attention is called with the head axis moved ahead of the sequence axis
        y = flex_attention(q.transpose(1, 2), k.transpose(1, 2), v.transpose(1, 2), block_mask=block_mask, scale=self.attn_scale).transpose(1, 2)
        y = y.contiguous().view(B, T, self.num_heads * self.head_dim) # re-assemble all head outputs side by side
        y = self.c_proj(y)
        return y

class MLP(nn.Module):
    """Feed-forward block: dim -> 4*dim -> dim with a squared-ReLU activation."""

    def __init__(self, dim: int):
        super().__init__()
        hdim = 4 * dim
        self.c_fc = CastedLinear(dim, hdim)
        self.c_proj = CastedLinear(hdim, dim)
        self.c_proj.weight.detach().zero_() # zero init suggested by @Grad62304977
        # per-parameter weight-decay multiplier read by Muon.step via getattr(p, "wd_mul", 1.0)
        self.c_fc.weight.wd_mul = 2.0
        self.c_proj.weight.wd_mul = 2.0

    def forward(self, x: Tensor):
        x = self.c_fc(x)
        x = F.relu(x).square() # https://arxiv.org/abs/2109.08668v2; ~1-2% better than GELU; suggested by @SKYLINEZ007 and @Grad62304977
        x = self.c_proj(x)
        return x

class Block(nn.Module):
    """Transformer block: learned mix with the initial embedding x0, optional attention, then MLP."""

    def __init__(self, dim: int, num_heads: int, max_seq_len: int, layer_idx: int):
        super().__init__()
        # skip attention of blocks.7 (the 8th layer) by @YouJiacheng
        self.attn = CausalSelfAttention(dim, num_heads, max_seq_len) if layer_idx != 7 else None
        self.mlp = MLP(dim)
        # weights for (running activation x, initial embedding x0)
        self.lambdas = nn.Parameter(torch.tensor([1.0, 0.0]))
        # eval-only running statistics: mean squares of the block input, the attention
        # output and the MLP output (each updated with lerp weight 0.5)
        self.record = nn.Buffer(torch.tensor([0.0, 0.0, 0.0]))

    def forward(self, x: Tensor, ve: Tensor | None, x0: Tensor, block_mask: BlockMask):
        x = self.lambdas[0] * x + self.lambdas[1] * x0
        if not self.training:
            self.record[0].lerp_(torch.square(x).mean(dtype=torch.float32), 0.5)
        if self.attn is not None:
            # note: attention receives x as-is; q, k, v are normalized inside the attention module
            z = self.attn(x, ve, block_mask)
            if not self.training:
                self.record[1].lerp_(torch.square(z).mean(dtype=torch.float32), 0.5)
            x = x + z
        z = self.mlp(norm(x))
        if not self.training:
            self.record[2].lerp_(torch.square(z).mean(dtype=torch.float32), 0.5)
        x = x + z
        return x

# -----------------------------------------------------------------------------
# The main model

def next_multiple_of_n(v: float | int, *, n: int):
    """Return the smallest positive multiple of `n` that is >= `v` (never less than `n`).

    Raises StopIteration if the candidate range is empty (e.g. sufficiently negative `v`).
    """
    return next(x for x in range(n, int(v) + 1 + n, n) if x >= v)

class GPT(nn.Module):
    """The language model; forward() returns the cross-entropy loss directly."""

    def __init__(self, vocab_size: int, num_layers: int, num_heads: int, model_dim: int, max_seq_len: int):
        super().__init__()
        self.embed = nn.Embedding(vocab_size, model_dim)
        # token value embeddings by @KoszarskyB - inspired by @Grad62304977's value residual implementation following https://arxiv.org/abs/2410.17897
        # value embedding code simplification inspired by @ragulpr https://github.com/KellerJordan/modded-nanogpt/pull/78
        self.value_embeds = nn.ModuleList([nn.Embedding(vocab_size, model_dim) for _ in range(3)])
        self.blocks = nn.ModuleList([Block(model_dim, num_heads, max_seq_len, i) for i in range(num_layers)])
        # there are only 50257 unique GPT-2 tokens; we extend to nearest multiple of 128 for efficiency.
        # suggested to me by @Grad62304977. this originates from Karpathy's experiments.
        self.lm_head = CastedLinear(model_dim, next_multiple_of_n(vocab_size, n=128),
                                    use_fp8=True, x_s=0.5, w_s=2**-9, grad_s=2**-19)
        self.lm_head.weight.detach().zero_() # @Grad62304977
        # Add learnable skip connection weights for decoder layers
        assert num_layers % 2 == 0
        self.skip_weights = nn.Parameter(torch.ones(num_layers//2))

    def create_blockmasks(self, input_seq: Tensor, sliding_window_num_blocks: Tensor):
        """Build the (long, short) sliding-window, document-causal BlockMasks for `input_seq`.

        Tokens equal to 50256 delimit documents. The long mask uses
        `sliding_window_num_blocks` blocks of 128 tokens, the short mask half of that.
        """
        BLOCK_SIZE = 128
        # running document index per token: increments at every 50256 token
        docs = (input_seq == 50256).cumsum(0)

        def document_causal(b, h, q_idx, kv_idx):
            # element-level mask: attend only backwards and only within the same document
            causal_mask = q_idx >= kv_idx
            document_mask = docs[q_idx] == docs[kv_idx]
            return causal_mask & document_mask

        def dense_to_ordered(dense_blockmask: Tensor):
            # convert a dense boolean block mask into (count, ordered indices) per query block;
            # the stable ascending argsort followed by flip lists the True blocks first
            num_blocks = dense_blockmask.sum(dim=-1, dtype=torch.int32)
            indices = dense_blockmask.argsort(dim=-1, descending=False, stable=True).flip(-1).to(torch.int32)
            return num_blocks[None, None].contiguous(), indices[None, None].contiguous()

        # manual block mask creation by @YouJiacheng
        assert len(input_seq) % BLOCK_SIZE == 0
        NUM_BLOCKS = len(input_seq) // BLOCK_SIZE
        block_idx = torch.arange(NUM_BLOCKS, dtype=torch.int32, device="cuda")
        # "any": some element pair in the block pair may be unmasked; "all": every pair is
        causal_blockmask_any = block_idx[:, None] >= block_idx
        causal_blockmask_all = block_idx[:, None] > block_idx
        # first / last document index within each block
        docs_low = docs.view(-1, BLOCK_SIZE)[:, 0].contiguous()
        docs_high = docs.view(-1, BLOCK_SIZE)[:, -1].contiguous()
        document_blockmask_any = (docs_low[:, None] <= docs_high) & (docs_high[:, None] >= docs_low)
        document_blockmask_all = (docs_low[:, None] == docs_high) & (docs_high[:, None] == docs_low)
        blockmask_any = causal_blockmask_any & document_blockmask_any
        blockmask_all = causal_blockmask_all & document_blockmask_all
        # partial blocks still need the element-level mask_mod; full blocks do not
        partial_kv_num_blocks, partial_kv_indices = dense_to_ordered(blockmask_any & ~blockmask_all)
        full_kv_num_blocks, full_kv_indices = dense_to_ordered(blockmask_all)
        def build_bm(window_size_blocks: Tensor) -> BlockMask:
            # limit the number of kv blocks per query block to the sliding window
            return BlockMask.from_kv_blocks(
                torch.clamp_max(partial_kv_num_blocks, torch.clamp_min(window_size_blocks - full_kv_num_blocks, 1)),
                partial_kv_indices,
                torch.clamp_max(full_kv_num_blocks, window_size_blocks - 1),
                full_kv_indices,
                BLOCK_SIZE=BLOCK_SIZE,
                mask_mod=document_causal,
            )
        # Long-short SWA block masks by @leloykun & @YouJiacheng, adapted from suggestion by @Grad62304977, following Gemma 2 paper
        return build_bm(sliding_window_num_blocks), build_bm(sliding_window_num_blocks // 2)

    def forward(self, input_seq: Tensor, target_seq: Tensor, sliding_window_num_blocks: Tensor):
        """Return the cross-entropy loss of predicting `target_seq` from the 1D `input_seq`.

        NOTE: the block-mask list and skip map below are written out for exactly
        16 blocks; the asserts fail for other depths.
        """
        assert input_seq.ndim == 1

        ve = [value_embed(input_seq) for value_embed in self.value_embeds]
        # 012 ... 012 structure on token value embeddings by @YouJiacheng, improved on @leloykun's U-net structure
        ve = [ve[0], ve[1], ve[2]] + [None] * (len(self.blocks) - 6) + [ve[0], ve[1], ve[2]]
        assert len(ve) == len(self.blocks)

        long_bm, short_bm = self.create_blockmasks(input_seq, sliding_window_num_blocks)
        block_masks = [long_bm, short_bm, short_bm, short_bm, long_bm, short_bm, short_bm, short_bm, short_bm, short_bm, short_bm, long_bm, short_bm, short_bm, short_bm, long_bm]
        assert len(block_masks) == len(self.blocks)

        x = x0 = norm(self.embed(input_seq)[None]) # use of norm here by @Grad62304977

        # U-net design by @brendanh0gan
        skip_connections = []
        n = len(self.skip_weights)
        # consumer block index -> index of the stored block output (and skip weight) added to its input
        skip_map = {
            9: 6,
            10: 4,
            11: 2,
        }
        for i in range(len(self.blocks)):
            if i in skip_map:
                x = x + self.skip_weights[skip_map[i]] * skip_connections[skip_map[i]]
            x = self.blocks[i](x, ve[i], x0, block_masks[i])
            # outputs of the first n blocks are kept as potential skip sources
            if i < n:
                skip_connections.append(x)

        x = norm(x)
        logits = self.lm_head(x)
        # @Grad62304977 added tanh softcapping following Gemma 2 paper, @KoszarskyB reduced it from 30 to 15, @YouJiacheng shifted it by +15 (2*sigmoid(2*x)=tanh(x)+1)
        logits = 30 * torch.sigmoid(logits.float() / 7.5)
        loss = F.cross_entropy(logits.view(-1, logits.size(-1)), target_seq)
        return loss

#
# -----------------------------------------------------------------------------
# Our own simple Distributed Data Loader

def _load_data_shard(file: Path):
    """Load one token shard into a pinned uint16 tensor.

    The file starts with a header of 256 int32 values: [0] magic number
    20240520, [1] version 1, [2] token count. The uint16 tokens follow.
    """
    header = torch.from_file(str(file), False, 256, dtype=torch.int32) # header is 256 int32
    assert header[0] == 20240520, "magic number mismatch in the data .bin file"
    assert header[1] == 1, "unsupported version"
    num_tokens = int(header[2]) # number of tokens (claimed)
    with file.open("rb", buffering=0) as f:
        tokens = torch.empty(num_tokens, dtype=torch.uint16, pin_memory=True) # avoid pin_memory copy by @YouJiacheng
        f.seek(256 * 4)
        nbytes = f.readinto(tokens.numpy()) # avoid bytes->array copy by @YouJiacheng
        assert nbytes == 2 * num_tokens, "number of tokens read does not match header"
    return tokens

def distributed_data_generator(filename_pattern: str, batch_size: int, rank : int, world_size : int):
    """Yield (inputs, targets) CUDA tensors forever, one slice of the global batch per rank.

    Shards matching `filename_pattern` (relative to the current working directory)
    are read in sorted order. `batch_size` is the global batch in tokens and must be
    divisible by `world_size`; each rank takes `batch_size // world_size` tokens,
    with targets shifted by one position.

    Raises:
        RuntimeError: when a new shard is needed but none is left (including the
            case where the pattern matches no file at all).
    """
    files = sorted(Path.cwd().glob(filename_pattern))
    assert batch_size % world_size == 0
    local_batch_size = batch_size // world_size
    file_iter = iter(files) # use itertools.cycle(files) instead if you want to do multi-epoch training

    def load_next_shard():
        # A bare next() here would leak StopIteration out of the generator body, which
        # Python turns into an opaque "generator raised StopIteration" RuntimeError;
        # raise the same exception type with a message that says what happened.
        try:
            shard = next(file_iter)
        except StopIteration:
            raise RuntimeError(
                f"no more data shards for pattern {filename_pattern!r} "
                f"({len(files)} file(s) matched)"
            ) from None
        return _load_data_shard(shard)

    tokens, pos = load_next_shard(), 0
    while True:
        # move on when the current shard cannot supply a full global batch plus one target token
        if pos + batch_size + 1 >= len(tokens):
            tokens, pos = load_next_shard(), 0
        buf = tokens[pos + rank * local_batch_size:][:local_batch_size + 1]
        inputs = buf[:-1].to(device="cuda", dtype=torch.int32, non_blocking=True) # no sync on host side;
        targets = buf[1:].to(device="cuda", dtype=torch.int64, non_blocking=True) # H2D in another stream isn't helpful.
        pos += batch_size
        yield inputs, targets

# -----------------------------------------------------------------------------
# int main

# Every attribute is annotated so that @dataclass actually registers it as a field
# (un-annotated class attributes are ignored by the decorator); defaults are unchanged
# and Hyperparameters() still yields the same values.
@dataclass
class Hyperparameters:
    # data
    train_files: str = "data/fineweb10B/fineweb_train_*.bin" # input .bin to train on
    val_files: str = "data/fineweb10B/fineweb_val_*.bin" # input .bin to eval validation loss on
    val_tokens: int = 10485760 # how many tokens of validation data? it's important to keep this fixed for consistent comparisons
    train_seq_len: int = 64*1024 # FlexAttention sequence length
    val_seq_len: int = 4*64*1024 # FlexAttention sequence length for validation
    # optimization
    num_iterations: int = 6710 # number of iterations to run
    cooldown_frac: float = 0.6 # fraction of training spent cooling down the learning rate
    # architecture
    vocab_size: int = 50257
    # evaluation and logging
    val_loss_every: int = 125 # every how many steps to evaluate val loss? 0 for only at the end
    save_checkpoint: bool = False
args = Hyperparameters()

# torchrun sets these env variables
rank = int(os.environ["RANK"])
world_size = int(os.environ["WORLD_SIZE"])
assert world_size == 8 # this code is designed for 8xH100
assert torch.cuda.is_available()
device = torch.device("cuda", int(os.environ["LOCAL_RANK"]))
torch.cuda.set_device(device)
dist.init_process_group(backend="nccl", device_id=device)
dist.barrier()
master_process = (rank == 0) # this process will do logging, checkpointing etc.

# begin logging
logfile = None
if master_process:
    run_id = uuid.uuid4()
    os.makedirs("logs", exist_ok=True)
    logfile = f"logs/{run_id}.txt"
    print(logfile)
def print0(s, console=False):
    """Append `s` to the run's log file on the master process (and echo to stdout if `console`); no-op elsewhere."""
    if master_process:
        with open(logfile, "a") as f:
            if console:
                print(s)
            print(s, file=f)

# begin by printing this file (the Python code)
print0(code)
print0("="*100)
# log information about the hardware/software environment this is running on
print0(f"Running Python {sys.version}")
print0(f"Running PyTorch {torch.version.__version__} compiled for CUDA {torch.version.cuda}")
def nvidia_smi():
    """Return the stdout of the `nvidia-smi` command as text."""
    import subprocess  # avoid top level import
    return subprocess.run(["nvidia-smi"], stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True).stdout
print0(nvidia_smi())
print0("="*100)

########################################
#    Construct model and optimizer     #
########################################

model: nn.Module = GPT(vocab_size=args.vocab_size, num_layers=16, num_heads=8, model_dim=1024,
                       max_seq_len=max(args.train_seq_len, args.val_seq_len)).cuda()
# embeddings are kept in bfloat16
for m in model.modules():
    if isinstance(m, nn.Embedding):
        m.bfloat16()
# every rank starts from rank 0's parameter values
for param in model.parameters():
    dist.broadcast(param.detach(), 0)

# collect the parameters to optimize
hidden_matrix_params = [p for n, p in model.blocks.named_parameters() if p.ndim >= 2 and "embed" not in n]
embed_params = [p for n, p in model.named_parameters() if "embed" in n]
scalar_params = [p for p in model.parameters() if p.ndim < 2]
head_params: list[nn.Parameter] = [model.lm_head.weight]

# init the optimizer(s)
adam_param_groups = [dict(params=head_params, lr=0.1/1024**0.5), dict(params=embed_params, lr=0.3), dict(params=scalar_params, lr=0.015)]
# small adam epsilon by @YouJiacheng. this is an alternate method of fixing the world_size dependence
# discovered by @fernbear.bsky.social https://x.com/hi_tysam/status/1879692937589875094
optimizer1 = torch.optim.Adam(adam_param_groups, betas=(0.8, 0.95), eps=1e-10, fused=True)
optimizer2 = Muon(hidden_matrix_params, lr=0.025, momentum=0.95, rank=rank, world_size=world_size)
optimizers: list[torch.optim.Optimizer] = [optimizer1, optimizer2]
def opt_params(opt: torch.optim.Optimizer) -> list[nn.Parameter]:
    """Flatten all parameters of `opt` across its param groups into one list."""
    return [p for group in opt.param_groups for p in group["params"]]
opt2params = {opt: opt_params(opt) for opt in optimizers}
# remember the base learning rate of every group; the schedule scales it each step
for opt in optimizers:
    for group in opt.param_groups:
        group["initial_lr"] = group["lr"]

# learning rate schedule: stable then decay
def get_lr(step: int):
    """Return the LR multiplier for `step`: 1.0, then linear decay to 0 over the last `cooldown_frac` of training."""
    x = step / args.num_iterations # progress in training
    assert 0 <= x < 1
    if x < 1 - args.cooldown_frac:
        return 1.0
    else:
        return (1 - x) / args.cooldown_frac

# attention window size schedule: linearly increase
@lru_cache(1)
def get_window_size_blocks_helper(window_size: int):
    """Return `window_size // 128` as an int32 CUDA scalar tensor; the most recent value is cached."""
    return torch.tensor(window_size // 128, dtype=torch.int32, pin_memory=True).cuda(non_blocking=True)
def get_window_size_blocks(step: int):
    """Return the sliding-window size (in 128-token blocks) for `step` as a CUDA tensor."""
    x = step / args.num_iterations # progress in training
    assert 0 <= x <= 1
    # Linearly increase the block-wise sliding window size over training 128 -> 1792
    # increase by @fernbear.bsky.social; block-wise by @YouJiacheng
    window_size = next_multiple_of_n(1728 * x, n=128)
    return get_window_size_blocks_helper(window_size)

model: nn.Module = torch.compile(model, dynamic=False)

########################################
#            Warmup kernels            #
########################################

# Warmup the training kernels, then re-initialize the state so we aren't cheating
warmup_steps = 10
initial_state = dict(model=copy.deepcopy(model.state_dict()),
                     optimizers=[copy.deepcopy(opt.state_dict()) for opt in optimizers]) # save the initial state
for _ in range(warmup_steps):
    # random tokens are enough to trigger compilation; inputs and targets share one tensor
    inputs = targets = torch.randint(0, args.vocab_size, size=(args.train_seq_len,), device="cuda")
    model(inputs.to(torch.int32), targets, get_window_size_blocks(0)).backward()
    for param in model.parameters():
        dist.all_reduce(param.grad, op=dist.ReduceOp.AVG)
    for opt in optimizers:
        opt.step()
    model.zero_grad(set_to_none=True)
# roll model and optimizers back to the state saved before warmup
model.load_state_dict(initial_state["model"])
for opt, opt_state in zip(optimizers, initial_state["optimizers"]):
    opt.load_state_dict(opt_state)
del initial_state

########################################
#        Training and validation       #
########################################

torch.cuda.reset_peak_memory_stats()
train_loader = distributed_data_generator(args.train_files, world_size * args.train_seq_len, rank, world_size)
training_time_ms = 0
# start the clock
torch.cuda.synchronize()
t0 = time.perf_counter()
# begin training
train_steps = args.num_iterations
for step in range(train_steps + 1):
    last_step = (step == train_steps)

    # --------------- VALIDATION SECTION -----------------
    if last_step or (args.val_loss_every > 0 and step % args.val_loss_every == 0):
        # stop the clock
        torch.cuda.synchronize()
        training_time_ms += 1000 * (time.perf_counter() - t0)
        model.eval()
        val_batch_size = world_size * args.val_seq_len
        assert args.val_tokens % val_batch_size == 0
        val_steps = args.val_tokens // val_batch_size
        # a fresh loader each time, so every evaluation reads the same validation tokens
        val_loader = distributed_data_generator(args.val_files, val_batch_size, rank, world_size)
        val_loss = 0
        with torch.no_grad():
            for _ in range(val_steps):
                inputs, targets = next(val_loader)
                val_loss += model(inputs, targets, get_window_size_blocks(step))
        val_loss /= val_steps
        del val_loader
        dist.all_reduce(val_loss, op=dist.ReduceOp.AVG)
        print0(f"step:{step}/{train_steps} val_loss:{val_loss:.6f} train_time:{training_time_ms:.0f}ms step_avg:{training_time_ms/max(step, 1):.2f}ms", console=True)
        # extra diagnostics (log file only): skip weights, per-block lambdas and recorded RMS values
        if hasattr(model, "skip_weights"):
            print0(s=f"{model.skip_weights}")
        print0(s="\n".join([f"{i} {block.lambdas.tolist()}" for i, block in enumerate(model.blocks)]))
        print0(s="\n".join([f"{i} {block.record.sqrt().tolist()}" for i, block in enumerate(model.blocks)]))
        model.train()
        # start the clock again
        torch.cuda.synchronize()
        t0 = time.perf_counter()

    if last_step:
        if master_process and args.save_checkpoint:
            log = dict(step=step, code=code, model=model.state_dict(), optimizers=[opt.state_dict() for opt in optimizers])
            os.makedirs(f"logs/{run_id}", exist_ok=True)
            torch.save(log, f"logs/{run_id}/state_step{step:06d}.pt")
        # the last step only has the validation loop, so break to avoid training
        break

    # --------------- TRAINING SECTION -----------------
    inputs, targets = next(train_loader)
    model(inputs, targets, get_window_size_blocks(step)).backward()
    # launch asynchronous gradient averaging, grouped by the optimizer that owns each parameter
    opt2works = {
        opt: [dist.all_reduce(p.grad, op=dist.ReduceOp.AVG, async_op=True) for p in params]
        for opt, params in opt2params.items()
    }
    # set optimization hyperparameters
    for opt in optimizers:
        for group in opt.param_groups:
            group["lr"] = group["initial_lr"] * get_lr(step)
    for group in optimizer2.param_groups:
        frac = min(step / 300, 1) # momentum warmup for muon
        group["momentum"] = (1 - frac) * 0.85 + frac * 0.95
    # step the optimizers
    for opt in optimizers:
        # wait only for this optimizer's gradients before stepping it
        for work in opt2works[opt]:
            work.wait()
        opt.step()
    # null the gradients
    model.zero_grad(set_to_none=True)
    # logging
    approx_training_time_ms = training_time_ms + 1000 * (time.perf_counter() - t0)
print0(f"step:{step+1}/{train_steps} train_time:{approx_training_time_ms:.0f}ms step_avg:{approx_training_time_ms/(step + 1):.2f}ms", console=True) print0(f"peak memory allocated: {torch.cuda.max_memory_allocated() // 1024 // 1024} MiB " f"reserved: {torch.cuda.max_memory_reserved() // 1024 // 1024} MiB", console=True) dist.destroy_process_group() ==================================================================================================== Running Python 3.12.9 (main, Feb 5 2025, 19:10:45) [Clang 19.1.6 ] Running PyTorch 2.7.0.dev20250114+cu126 compiled for CUDA 12.6 Fri Mar 28 16:33:32 2025 +---------------------------------------------------------------------------------------+ | NVIDIA-SMI 535.129.03 Driver Version: 535.129.03 CUDA Version: 12.8 | |-----------------------------------------+----------------------+----------------------+ | GPU Name Persistence-M | Bus-Id Disp.A | Volatile Uncorr. ECC | | Fan Temp Perf Pwr:Usage/Cap | Memory-Usage | GPU-Util Compute M. | | | | MIG M. 
| |=========================================+======================+======================| | 0 NVIDIA H100 80GB HBM3 On | 00000000:65:02.0 Off | 0 | | N/A 36C P0 114W / 700W | 7750MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+----------------------+----------------------+ | 1 NVIDIA H100 80GB HBM3 On | 00000000:67:02.0 Off | 0 | | N/A 41C P0 121W / 700W | 3459MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+----------------------+----------------------+ | 2 NVIDIA H100 80GB HBM3 On | 00000000:69:02.0 Off | 0 | | N/A 41C P0 126W / 700W | 3459MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+----------------------+----------------------+ | 3 NVIDIA H100 80GB HBM3 On | 00000000:6B:02.0 Off | 0 | | N/A 36C P0 118W / 700W | 3459MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+----------------------+----------------------+ | 4 NVIDIA H100 80GB HBM3 On | 00000000:6F:02.0 Off | 0 | | N/A 36C P0 116W / 700W | 3459MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+----------------------+----------------------+ | 5 NVIDIA H100 80GB HBM3 On | 00000000:71:02.0 Off | 0 | | N/A 41C P0 123W / 700W | 3459MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+----------------------+----------------------+ | 6 NVIDIA H100 80GB HBM3 On | 00000000:73:02.0 Off | 0 | | N/A 41C P0 122W / 700W | 3459MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+----------------------+----------------------+ | 7 NVIDIA H100 80GB HBM3 On | 00000000:75:02.0 Off | 0 | | N/A 34C P0 114W / 700W | 3219MiB / 81559MiB | 0% Default | | | | Disabled | +-----------------------------------------+----------------------+----------------------+ +---------------------------------------------------------------------------------------+ | 
Processes: | | GPU GI CI PID Type Process name GPU Memory | | ID ID Usage | |=======================================================================================| +---------------------------------------------------------------------------------------+ ==================================================================================================== step:0/6710 val_loss:10.825840 train_time:0ms step_avg:0.02ms Parameter containing: tensor([1., 1., 1., 1., 1., 1., 1., 1.], device='cuda:0', requires_grad=True) 0 [1.0, 0.0] 1 [1.0, 0.0] 2 [1.0, 0.0] 3 [1.0, 0.0] 4 [1.0, 0.0] 5 [1.0, 0.0] 6 [1.0, 0.0] 7 [1.0, 0.0] 8 [1.0, 0.0] 9 [1.0, 0.0] 10 [1.0, 0.0] 11 [1.0, 0.0] 12 [1.0, 0.0] 13 [1.0, 0.0] 14 [1.0, 0.0] 15 [1.0, 0.0] 0 [0.980345606803894, 0.0, 0.0] 1 [0.980345606803894, 0.0, 0.0] 2 [0.980345606803894, 0.0, 0.0] 3 [0.980345606803894, 0.0, 0.0] 4 [0.980345606803894, 0.0, 0.0] 5 [0.980345606803894, 0.0, 0.0] 6 [0.980345606803894, 0.0, 0.0] 7 [0.980345606803894, 0.0, 0.0] 8 [0.980345606803894, 0.0, 0.0] 9 [1.960691213607788, 0.0, 0.0] 10 [2.9410159587860107, 0.0, 0.0] 11 [3.921382427215576, 0.0, 0.0] 12 [3.921382427215576, 0.0, 0.0] 13 [3.921382427215576, 0.0, 0.0] 14 [3.921382427215576, 0.0, 0.0] 15 [3.921382188796997, 0.0, 0.0] step:1/6710 train_time:163ms step_avg:163.04ms step:2/6710 train_time:319ms step_avg:159.46ms step:3/6710 train_time:529ms step_avg:176.18ms step:4/6710 train_time:747ms step_avg:186.78ms step:5/6710 train_time:966ms step_avg:193.28ms step:6/6710 train_time:1186ms step_avg:197.66ms step:7/6710 train_time:1415ms step_avg:202.12ms step:8/6710 train_time:1639ms step_avg:204.87ms step:9/6710 train_time:1861ms step_avg:206.77ms step:10/6710 train_time:2080ms step_avg:208.04ms step:11/6710 train_time:2307ms step_avg:209.72ms step:12/6710 train_time:2533ms step_avg:211.09ms step:13/6710 train_time:2756ms step_avg:211.98ms step:14/6710 train_time:2977ms step_avg:212.64ms step:15/6710 train_time:3200ms step_avg:213.34ms step:16/6710 
train_time:3426ms step_avg:214.10ms step:17/6710 train_time:3649ms step_avg:214.64ms step:18/6710 train_time:3871ms step_avg:215.05ms step:19/6710 train_time:4092ms step_avg:215.37ms step:20/6710 train_time:4315ms step_avg:215.76ms step:21/6710 train_time:4542ms step_avg:216.29ms step:22/6710 train_time:4766ms step_avg:216.64ms step:23/6710 train_time:4988ms step_avg:216.87ms step:24/6710 train_time:5210ms step_avg:217.10ms step:25/6710 train_time:5432ms step_avg:217.29ms step:26/6710 train_time:5656ms step_avg:217.55ms step:27/6710 train_time:5880ms step_avg:217.77ms step:28/6710 train_time:6103ms step_avg:217.96ms step:29/6710 train_time:6326ms step_avg:218.14ms step:30/6710 train_time:6549ms step_avg:218.29ms step:31/6710 train_time:6771ms step_avg:218.41ms step:32/6710 train_time:6991ms step_avg:218.48ms step:33/6710 train_time:7215ms step_avg:218.63ms step:34/6710 train_time:7438ms step_avg:218.76ms step:35/6710 train_time:7661ms step_avg:218.87ms step:36/6710 train_time:7882ms step_avg:218.95ms step:37/6710 train_time:8104ms step_avg:219.04ms step:38/6710 train_time:8328ms step_avg:219.16ms step:39/6710 train_time:8550ms step_avg:219.24ms step:40/6710 train_time:8772ms step_avg:219.30ms step:41/6710 train_time:8993ms step_avg:219.35ms step:42/6710 train_time:9215ms step_avg:219.41ms step:43/6710 train_time:9439ms step_avg:219.51ms step:44/6710 train_time:9662ms step_avg:219.59ms step:45/6710 train_time:9883ms step_avg:219.62ms step:46/6710 train_time:10105ms step_avg:219.68ms step:47/6710 train_time:10327ms step_avg:219.73ms step:48/6710 train_time:10549ms step_avg:219.77ms step:49/6710 train_time:10769ms step_avg:219.79ms step:50/6710 train_time:10991ms step_avg:219.81ms step:51/6710 train_time:11212ms step_avg:219.84ms step:52/6710 train_time:11434ms step_avg:219.88ms step:53/6710 train_time:11656ms step_avg:219.93ms step:54/6710 train_time:11879ms step_avg:219.98ms step:55/6710 train_time:12102ms step_avg:220.03ms step:56/6710 train_time:12324ms 
step_avg:220.07ms step:57/6710 train_time:12546ms step_avg:220.11ms step:58/6710 train_time:12768ms step_avg:220.14ms step:59/6710 train_time:12990ms step_avg:220.18ms step:60/6710 train_time:13213ms step_avg:220.22ms step:61/6710 train_time:13433ms step_avg:220.22ms step:62/6710 train_time:13656ms step_avg:220.25ms step:63/6710 train_time:13877ms step_avg:220.27ms step:64/6710 train_time:14099ms step_avg:220.30ms step:65/6710 train_time:14321ms step_avg:220.33ms step:66/6710 train_time:14544ms step_avg:220.36ms step:67/6710 train_time:14766ms step_avg:220.39ms step:68/6710 train_time:14988ms step_avg:220.42ms step:69/6710 train_time:15209ms step_avg:220.42ms step:70/6710 train_time:15430ms step_avg:220.43ms step:71/6710 train_time:15651ms step_avg:220.44ms step:72/6710 train_time:15872ms step_avg:220.44ms step:73/6710 train_time:16093ms step_avg:220.45ms step:74/6710 train_time:16314ms step_avg:220.46ms step:75/6710 train_time:16535ms step_avg:220.47ms step:76/6710 train_time:16755ms step_avg:220.47ms step:77/6710 train_time:16976ms step_avg:220.47ms step:78/6710 train_time:17197ms step_avg:220.48ms step:79/6710 train_time:17421ms step_avg:220.52ms step:80/6710 train_time:17642ms step_avg:220.53ms step:81/6710 train_time:17865ms step_avg:220.56ms step:82/6710 train_time:18087ms step_avg:220.57ms step:83/6710 train_time:18308ms step_avg:220.57ms step:84/6710 train_time:18529ms step_avg:220.59ms step:85/6710 train_time:18751ms step_avg:220.59ms step:86/6710 train_time:18972ms step_avg:220.60ms step:87/6710 train_time:19194ms step_avg:220.62ms step:88/6710 train_time:19415ms step_avg:220.63ms step:89/6710 train_time:19637ms step_avg:220.64ms step:90/6710 train_time:19859ms step_avg:220.65ms step:91/6710 train_time:20080ms step_avg:220.66ms step:92/6710 train_time:20303ms step_avg:220.68ms step:93/6710 train_time:20524ms step_avg:220.69ms step:94/6710 train_time:20746ms step_avg:220.71ms step:95/6710 train_time:20967ms step_avg:220.71ms step:96/6710 train_time:21188ms 
step_avg:220.71ms step:97/6710 train_time:21409ms step_avg:220.71ms step:98/6710 train_time:21630ms step_avg:220.71ms step:99/6710 train_time:21851ms step_avg:220.71ms step:100/6710 train_time:22070ms step_avg:220.70ms step:101/6710 train_time:22292ms step_avg:220.71ms step:102/6710 train_time:22513ms step_avg:220.72ms step:103/6710 train_time:22735ms step_avg:220.72ms step:104/6710 train_time:22957ms step_avg:220.74ms step:105/6710 train_time:23176ms step_avg:220.72ms step:106/6710 train_time:23398ms step_avg:220.74ms step:107/6710 train_time:23620ms step_avg:220.75ms step:108/6710 train_time:23842ms step_avg:220.76ms step:109/6710 train_time:24063ms step_avg:220.76ms step:110/6710 train_time:24285ms step_avg:220.77ms step:111/6710 train_time:24506ms step_avg:220.78ms step:112/6710 train_time:24730ms step_avg:220.80ms step:113/6710 train_time:24950ms step_avg:220.80ms step:114/6710 train_time:25171ms step_avg:220.80ms step:115/6710 train_time:25392ms step_avg:220.80ms step:116/6710 train_time:25612ms step_avg:220.79ms step:117/6710 train_time:25835ms step_avg:220.81ms step:118/6710 train_time:26055ms step_avg:220.80ms step:119/6710 train_time:26276ms step_avg:220.81ms step:120/6710 train_time:26499ms step_avg:220.82ms step:121/6710 train_time:26721ms step_avg:220.83ms step:122/6710 train_time:26943ms step_avg:220.84ms step:123/6710 train_time:27163ms step_avg:220.83ms step:124/6710 train_time:27384ms step_avg:220.84ms step:125/6710 train_time:27605ms step_avg:220.84ms step:125/6710 val_loss:4.509298 train_time:27779ms step_avg:222.23ms Parameter containing: tensor([1.0000, 1.0000, 0.9893, 1.0000, 0.8621, 1.0000, 0.8154, 1.0000], device='cuda:0', requires_grad=True) 0 [1.0406980514526367, 0.04069794714450836] 1 [0.9171246290206909, 0.07475923001766205] 2 [0.8688899278640747, 0.1271146982908249] 3 [0.7313400506973267, 0.16463859379291534] 4 [0.7770416736602783, 0.160187229514122] 5 [0.68061763048172, 0.1461925208568573] 6 [0.7479856610298157, 0.1680511087179184] 7 
[0.7724498510360718, 0.15360446274280548] 8 [0.684529721736908, 0.18712468445301056] 9 [0.7419437170028687, 0.194843590259552] 10 [0.8086865544319153, 0.19345125555992126] 11 [0.912903904914856, 0.19378338754177094] 12 [0.9024471044540405, 0.19586491584777832] 13 [0.8786758780479431, 0.19964517652988434] 14 [0.9019429683685303, 0.21212206780910492] 15 [0.9047420620918274, 0.21505317091941833] 0 [1.0777493715286255, 0.7736283540725708, 0.7414581179618835] 1 [1.6722455024719238, 0.965424120426178, 0.7644904851913452] 2 [2.213808536529541, 1.2323780059814453, 0.5499558448791504] 3 [2.2552359104156494, 0.5630378723144531, 0.7114850282669067] 4 [2.2561328411102295, 0.4875413775444031, 0.650216281414032] 5 [1.941368818283081, 0.58622145652771, 0.8047398924827576] 6 [2.0531394481658936, 0.5305519104003906, 0.8134761452674866] 7 [2.168478488922119, 0.0, 0.9564886689186096] 8 [1.9608103036880493, 0.5539873838424683, 1.1135700941085815] 9 [3.716508150100708, 0.4940166473388672, 1.0091291666030884] 10 [5.282750606536865, 0.44392871856689453, 0.8157856464385986] 11 [7.551239967346191, 0.4011285901069641, 0.6533820033073425] 12 [7.216255187988281, 0.39262455701828003, 0.7007722854614258] 13 [6.762092113494873, 1.250331163406372, 0.715566098690033] 14 [6.724518299102783, 1.1978039741516113, 0.8488454222679138] 15 [6.762991428375244, 1.140478253364563, 1.0704455375671387] step:126/6710 train_time:27825ms step_avg:220.84ms step:127/6710 train_time:28043ms step_avg:220.81ms step:128/6710 train_time:28271ms step_avg:220.87ms step:129/6710 train_time:28493ms step_avg:220.88ms step:130/6710 train_time:28714ms step_avg:220.87ms step:131/6710 train_time:28938ms step_avg:220.90ms step:132/6710 train_time:29159ms step_avg:220.90ms step:133/6710 train_time:29381ms step_avg:220.91ms step:134/6710 train_time:29602ms step_avg:220.91ms step:135/6710 train_time:29824ms step_avg:220.92ms step:136/6710 train_time:30043ms step_avg:220.91ms step:137/6710 train_time:30265ms step_avg:220.92ms 
step:138/6710 train_time:30487ms step_avg:220.92ms step:139/6710 train_time:30707ms step_avg:220.92ms step:140/6710 train_time:30928ms step_avg:220.92ms step:141/6710 train_time:31150ms step_avg:220.92ms step:142/6710 train_time:31371ms step_avg:220.93ms step:143/6710 train_time:31593ms step_avg:220.93ms step:144/6710 train_time:31813ms step_avg:220.92ms step:145/6710 train_time:32034ms step_avg:220.92ms step:146/6710 train_time:32254ms step_avg:220.92ms step:147/6710 train_time:32475ms step_avg:220.92ms step:148/6710 train_time:32696ms step_avg:220.92ms step:149/6710 train_time:32915ms step_avg:220.91ms step:150/6710 train_time:33138ms step_avg:220.92ms step:151/6710 train_time:33359ms step_avg:220.92ms step:152/6710 train_time:33580ms step_avg:220.92ms step:153/6710 train_time:33801ms step_avg:220.92ms step:154/6710 train_time:34023ms step_avg:220.93ms step:155/6710 train_time:34242ms step_avg:220.92ms step:156/6710 train_time:34463ms step_avg:220.92ms step:157/6710 train_time:34683ms step_avg:220.91ms step:158/6710 train_time:34904ms step_avg:220.91ms step:159/6710 train_time:35124ms step_avg:220.91ms step:160/6710 train_time:35344ms step_avg:220.90ms step:161/6710 train_time:35564ms step_avg:220.89ms step:162/6710 train_time:35785ms step_avg:220.89ms step:163/6710 train_time:36005ms step_avg:220.89ms step:164/6710 train_time:36226ms step_avg:220.89ms step:165/6710 train_time:36445ms step_avg:220.88ms step:166/6710 train_time:36665ms step_avg:220.88ms step:167/6710 train_time:36886ms step_avg:220.87ms step:168/6710 train_time:37106ms step_avg:220.87ms step:169/6710 train_time:37325ms step_avg:220.86ms step:170/6710 train_time:37545ms step_avg:220.85ms step:171/6710 train_time:37765ms step_avg:220.85ms step:172/6710 train_time:37987ms step_avg:220.85ms step:173/6710 train_time:38207ms step_avg:220.85ms step:174/6710 train_time:38427ms step_avg:220.84ms step:175/6710 train_time:38645ms step_avg:220.83ms step:176/6710 train_time:38865ms step_avg:220.82ms 
step:177/6710 train_time:39085ms step_avg:220.82ms step:178/6710 train_time:39305ms step_avg:220.82ms step:179/6710 train_time:39525ms step_avg:220.81ms step:180/6710 train_time:39744ms step_avg:220.80ms step:181/6710 train_time:39964ms step_avg:220.80ms step:182/6710 train_time:40184ms step_avg:220.79ms step:183/6710 train_time:40405ms step_avg:220.79ms step:184/6710 train_time:40624ms step_avg:220.78ms step:185/6710 train_time:40842ms step_avg:220.77ms step:186/6710 train_time:41063ms step_avg:220.77ms step:187/6710 train_time:41286ms step_avg:220.78ms step:188/6710 train_time:41504ms step_avg:220.77ms step:189/6710 train_time:41722ms step_avg:220.75ms step:190/6710 train_time:41942ms step_avg:220.75ms step:191/6710 train_time:42164ms step_avg:220.75ms step:192/6710 train_time:42385ms step_avg:220.76ms step:193/6710 train_time:42607ms step_avg:220.76ms step:194/6710 train_time:42825ms step_avg:220.75ms step:195/6710 train_time:43044ms step_avg:220.74ms step:196/6710 train_time:43266ms step_avg:220.74ms step:197/6710 train_time:43485ms step_avg:220.74ms step:198/6710 train_time:43705ms step_avg:220.73ms step:199/6710 train_time:43923ms step_avg:220.72ms step:200/6710 train_time:44143ms step_avg:220.71ms step:201/6710 train_time:44366ms step_avg:220.73ms step:202/6710 train_time:44585ms step_avg:220.72ms step:203/6710 train_time:44805ms step_avg:220.71ms step:204/6710 train_time:45024ms step_avg:220.71ms step:205/6710 train_time:45245ms step_avg:220.71ms step:206/6710 train_time:45466ms step_avg:220.71ms step:207/6710 train_time:45686ms step_avg:220.70ms step:208/6710 train_time:45905ms step_avg:220.70ms step:209/6710 train_time:46125ms step_avg:220.69ms step:210/6710 train_time:46345ms step_avg:220.69ms step:211/6710 train_time:46565ms step_avg:220.69ms step:212/6710 train_time:46786ms step_avg:220.69ms step:213/6710 train_time:47005ms step_avg:220.68ms step:214/6710 train_time:47225ms step_avg:220.68ms step:215/6710 train_time:47444ms step_avg:220.67ms 
step:216/6710 train_time:47664ms step_avg:220.67ms step:217/6710 train_time:47884ms step_avg:220.66ms step:218/6710 train_time:48103ms step_avg:220.66ms step:219/6710 train_time:48323ms step_avg:220.65ms step:220/6710 train_time:48544ms step_avg:220.66ms step:221/6710 train_time:48766ms step_avg:220.66ms step:222/6710 train_time:48985ms step_avg:220.65ms step:223/6710 train_time:49203ms step_avg:220.64ms step:224/6710 train_time:49423ms step_avg:220.64ms step:225/6710 train_time:49642ms step_avg:220.63ms step:226/6710 train_time:49863ms step_avg:220.63ms step:227/6710 train_time:50083ms step_avg:220.63ms step:228/6710 train_time:50302ms step_avg:220.62ms step:229/6710 train_time:50522ms step_avg:220.62ms step:230/6710 train_time:50742ms step_avg:220.62ms step:231/6710 train_time:50962ms step_avg:220.61ms step:232/6710 train_time:51183ms step_avg:220.62ms step:233/6710 train_time:51401ms step_avg:220.61ms step:234/6710 train_time:51622ms step_avg:220.61ms step:235/6710 train_time:51844ms step_avg:220.61ms step:236/6710 train_time:52065ms step_avg:220.61ms step:237/6710 train_time:52284ms step_avg:220.61ms step:238/6710 train_time:52503ms step_avg:220.60ms step:239/6710 train_time:52724ms step_avg:220.60ms step:240/6710 train_time:52943ms step_avg:220.59ms step:241/6710 train_time:53163ms step_avg:220.59ms step:242/6710 train_time:53383ms step_avg:220.59ms step:243/6710 train_time:53603ms step_avg:220.59ms step:244/6710 train_time:53824ms step_avg:220.59ms step:245/6710 train_time:54044ms step_avg:220.59ms step:246/6710 train_time:54263ms step_avg:220.58ms step:247/6710 train_time:54484ms step_avg:220.58ms step:248/6710 train_time:54703ms step_avg:220.58ms step:249/6710 train_time:54923ms step_avg:220.57ms step:250/6710 train_time:55143ms step_avg:220.57ms step:250/6710 val_loss:4.185414 train_time:55318ms step_avg:221.27ms Parameter containing: tensor([1.0000, 1.0000, 0.8591, 1.0000, 0.6976, 1.0000, 0.7600, 1.0000], device='cuda:0', requires_grad=True) 0 
[1.2591508626937866, 0.2591504454612732] 1 [0.7913157939910889, 0.34785136580467224] 2 [0.787757158279419, 0.3243969976902008] 3 [0.5691148042678833, 0.2990681231021881] 4 [0.6629195213317871, 0.27020859718322754] 5 [0.6057382822036743, 0.2293466180562973] 6 [0.6742076277732849, 0.3068026602268219] 7 [0.7405307292938232, 0.29312679171562195] 8 [0.5663794279098511, 0.35536181926727295] 9 [0.7378698587417603, 0.365424782037735] 10 [0.7779419422149658, 0.33428728580474854] 11 [0.8615737557411194, 0.31886520981788635] 12 [0.8783013820648193, 0.3174259066581726] 13 [0.8752872347831726, 0.3205696642398834] 14 [0.9289514422416687, 0.381246417760849] 15 [0.9243648052215576, 0.37441354990005493] 0 [1.5060168504714966, 1.524865984916687, 1.7241809368133545] 1 [2.8530688285827637, 1.9965564012527466, 1.7455836534500122] 2 [3.9700136184692383, 2.1521875858306885, 1.3002657890319824] 3 [3.276289224624634, 1.133551001548767, 1.6886382102966309] 4 [3.2565720081329346, 0.9799519181251526, 1.476282000541687] 5 [2.810539484024048, 1.2214446067810059, 1.7393072843551636] 6 [3.1487131118774414, 1.1968308687210083, 1.5500798225402832] 7 [3.532693386077881, 0.0, 2.2679879665374756] 8 [2.9239656925201416, 1.4364036321640015, 2.379354476928711] 9 [6.127072334289551, 1.2789170742034912, 2.179577350616455] 10 [8.069775581359863, 1.0785698890686035, 1.8096864223480225] 11 [11.170607566833496, 0.8777099847793579, 1.5300019979476929] 12 [10.637754440307617, 0.9373247027397156, 1.5224261283874512] 13 [10.170358657836914, 2.459062337875366, 1.6228586435317993] 14 [10.644953727722168, 2.3631765842437744, 2.09011173248291] 15 [11.146924018859863, 2.566683053970337, 3.6219778060913086] step:251/6710 train_time:55365ms step_avg:220.58ms step:252/6710 train_time:55582ms step_avg:220.56ms step:253/6710 train_time:55803ms step_avg:220.57ms step:254/6710 train_time:56028ms step_avg:220.58ms step:255/6710 train_time:56247ms step_avg:220.58ms step:256/6710 train_time:56470ms step_avg:220.59ms 
step:257/6710 train_time:56687ms step_avg:220.57ms step:258/6710 train_time:56909ms step_avg:220.58ms step:259/6710 train_time:57130ms step_avg:220.58ms step:260/6710 train_time:57350ms step_avg:220.58ms step:261/6710 train_time:57571ms step_avg:220.58ms step:262/6710 train_time:57789ms step_avg:220.57ms step:263/6710 train_time:58010ms step_avg:220.57ms step:264/6710 train_time:58229ms step_avg:220.57ms step:265/6710 train_time:58451ms step_avg:220.57ms step:266/6710 train_time:58670ms step_avg:220.56ms step:267/6710 train_time:58889ms step_avg:220.56ms step:268/6710 train_time:59109ms step_avg:220.56ms step:269/6710 train_time:59329ms step_avg:220.55ms step:270/6710 train_time:59549ms step_avg:220.55ms step:271/6710 train_time:59769ms step_avg:220.55ms step:272/6710 train_time:59989ms step_avg:220.55ms step:273/6710 train_time:60209ms step_avg:220.55ms step:274/6710 train_time:60428ms step_avg:220.54ms step:275/6710 train_time:60647ms step_avg:220.54ms step:276/6710 train_time:60868ms step_avg:220.54ms step:277/6710 train_time:61089ms step_avg:220.54ms step:278/6710 train_time:61311ms step_avg:220.54ms step:279/6710 train_time:61529ms step_avg:220.54ms step:280/6710 train_time:61749ms step_avg:220.53ms step:281/6710 train_time:61969ms step_avg:220.53ms step:282/6710 train_time:62189ms step_avg:220.53ms step:283/6710 train_time:62408ms step_avg:220.52ms step:284/6710 train_time:62628ms step_avg:220.52ms step:285/6710 train_time:62849ms step_avg:220.52ms step:286/6710 train_time:63070ms step_avg:220.53ms step:287/6710 train_time:63290ms step_avg:220.52ms step:288/6710 train_time:63508ms step_avg:220.51ms step:289/6710 train_time:63728ms step_avg:220.51ms step:290/6710 train_time:63949ms step_avg:220.51ms step:291/6710 train_time:64169ms step_avg:220.51ms step:292/6710 train_time:64388ms step_avg:220.51ms step:293/6710 train_time:64609ms step_avg:220.51ms step:294/6710 train_time:64829ms step_avg:220.51ms step:295/6710 train_time:65050ms step_avg:220.51ms 
step:296/6710 train_time:65269ms step_avg:220.50ms step:297/6710 train_time:65489ms step_avg:220.50ms step:298/6710 train_time:65709ms step_avg:220.50ms step:299/6710 train_time:65927ms step_avg:220.49ms step:300/6710 train_time:66149ms step_avg:220.50ms step:301/6710 train_time:66368ms step_avg:220.49ms step:302/6710 train_time:66589ms step_avg:220.49ms step:303/6710 train_time:66808ms step_avg:220.49ms step:304/6710 train_time:67029ms step_avg:220.49ms step:305/6710 train_time:67250ms step_avg:220.49ms step:306/6710 train_time:67468ms step_avg:220.48ms step:307/6710 train_time:67689ms step_avg:220.49ms step:308/6710 train_time:67908ms step_avg:220.48ms step:309/6710 train_time:68129ms step_avg:220.48ms step:310/6710 train_time:68350ms step_avg:220.48ms step:311/6710 train_time:68570ms step_avg:220.48ms step:312/6710 train_time:68789ms step_avg:220.48ms step:313/6710 train_time:69008ms step_avg:220.47ms step:314/6710 train_time:69228ms step_avg:220.47ms step:315/6710 train_time:69448ms step_avg:220.47ms step:316/6710 train_time:69669ms step_avg:220.47ms step:317/6710 train_time:69888ms step_avg:220.47ms step:318/6710 train_time:70108ms step_avg:220.46ms step:319/6710 train_time:70327ms step_avg:220.46ms step:320/6710 train_time:70547ms step_avg:220.46ms step:321/6710 train_time:70767ms step_avg:220.46ms step:322/6710 train_time:70987ms step_avg:220.46ms step:323/6710 train_time:71207ms step_avg:220.46ms step:324/6710 train_time:71427ms step_avg:220.45ms step:325/6710 train_time:71648ms step_avg:220.45ms step:326/6710 train_time:71868ms step_avg:220.45ms step:327/6710 train_time:72087ms step_avg:220.45ms step:328/6710 train_time:72306ms step_avg:220.45ms step:329/6710 train_time:72527ms step_avg:220.45ms step:330/6710 train_time:72747ms step_avg:220.44ms step:331/6710 train_time:72968ms step_avg:220.45ms step:332/6710 train_time:73188ms step_avg:220.44ms step:333/6710 train_time:73408ms step_avg:220.44ms step:334/6710 train_time:73627ms step_avg:220.44ms 
step:335/6710 train_time:73847ms step_avg:220.44ms step:336/6710 train_time:74067ms step_avg:220.44ms step:337/6710 train_time:74288ms step_avg:220.44ms step:338/6710 train_time:74509ms step_avg:220.44ms step:339/6710 train_time:74728ms step_avg:220.44ms step:340/6710 train_time:74949ms step_avg:220.44ms step:341/6710 train_time:75168ms step_avg:220.43ms step:342/6710 train_time:75389ms step_avg:220.43ms step:343/6710 train_time:75609ms step_avg:220.43ms step:344/6710 train_time:75828ms step_avg:220.43ms step:345/6710 train_time:76048ms step_avg:220.43ms step:346/6710 train_time:76269ms step_avg:220.43ms step:347/6710 train_time:76490ms step_avg:220.43ms step:348/6710 train_time:76710ms step_avg:220.43ms step:349/6710 train_time:76929ms step_avg:220.43ms step:350/6710 train_time:77149ms step_avg:220.43ms step:351/6710 train_time:77369ms step_avg:220.42ms step:352/6710 train_time:77589ms step_avg:220.42ms step:353/6710 train_time:77809ms step_avg:220.42ms step:354/6710 train_time:78028ms step_avg:220.42ms step:355/6710 train_time:78247ms step_avg:220.42ms step:356/6710 train_time:78469ms step_avg:220.42ms step:357/6710 train_time:78688ms step_avg:220.42ms step:358/6710 train_time:78908ms step_avg:220.41ms step:359/6710 train_time:79128ms step_avg:220.41ms step:360/6710 train_time:79348ms step_avg:220.41ms step:361/6710 train_time:79569ms step_avg:220.41ms step:362/6710 train_time:79788ms step_avg:220.41ms step:363/6710 train_time:80008ms step_avg:220.41ms step:364/6710 train_time:80227ms step_avg:220.40ms step:365/6710 train_time:80449ms step_avg:220.41ms step:366/6710 train_time:80668ms step_avg:220.40ms step:367/6710 train_time:80888ms step_avg:220.40ms step:368/6710 train_time:81107ms step_avg:220.40ms step:369/6710 train_time:81327ms step_avg:220.40ms step:370/6710 train_time:81548ms step_avg:220.40ms step:371/6710 train_time:81768ms step_avg:220.40ms step:372/6710 train_time:81989ms step_avg:220.40ms step:373/6710 train_time:82207ms step_avg:220.39ms 
step:374/6710 train_time:82426ms step_avg:220.39ms step:375/6710 train_time:82647ms step_avg:220.39ms step:375/6710 val_loss:4.041555 train_time:82821ms step_avg:220.86ms Parameter containing: tensor([1.0000, 1.0000, 0.7645, 1.0000, 0.5846, 1.0000, 0.7357, 1.0000], device='cuda:0', requires_grad=True) 0 [1.6403642892837524, 0.6403639316558838] 1 [0.7142341732978821, 0.7813425064086914] 2 [0.7732452750205994, 0.6773967146873474] 3 [0.5972092747688293, 0.5055809020996094] 4 [0.6416104435920715, 0.49456584453582764] 5 [0.5903162360191345, 0.41927197575569153] 6 [0.633057713508606, 0.5464056730270386] 7 [0.8407480716705322, 0.5849569439888] 8 [0.4531615972518921, 0.5970875024795532] 9 [0.7167664170265198, 0.6849685311317444] 10 [0.7568789720535278, 0.6598384380340576] 11 [0.8235663175582886, 0.6303218603134155] 12 [0.8741365671157837, 0.6118046045303345] 13 [0.8992729187011719, 0.6026722192764282] 14 [0.9705013632774353, 0.7270904183387756] 15 [0.9796665906906128, 0.6950669884681702] 0 [2.2600810527801514, 3.012939691543579, 3.4117865562438965] 1 [4.930606365203857, 3.748314142227173, 3.5572383403778076] 2 [7.367373943328857, 3.7372679710388184, 2.764357805252075] 3 [6.450159072875977, 2.2893636226654053, 3.73606276512146] 4 [6.471477031707764, 2.0940606594085693, 3.243194580078125] 5 [5.659660339355469, 2.565053939819336, 3.6205813884735107] 6 [6.088792324066162, 2.599027633666992, 3.098667860031128] 7 [8.022628784179688, 0.0, 5.3272576332092285] 8 [5.336169719696045, 3.0586445331573486, 4.912380695343018] 9 [11.694649696350098, 2.713809013366699, 4.435400009155273] 10 [14.94261360168457, 2.344195604324341, 3.8126909732818604] 11 [19.66762924194336, 1.8856971263885498, 3.2745018005371094] 12 [19.05699920654297, 2.096156597137451, 3.2492668628692627] 13 [19.126314163208008, 4.61470890045166, 3.639371156692505] 14 [21.1341609954834, 4.753126621246338, 5.140233993530273] 15 [23.72291374206543, 5.698940753936768, 9.987494468688965] step:376/6710 train_time:82868ms 
step_avg:220.39ms step:377/6710 train_time:83084ms step_avg:220.38ms step:378/6710 train_time:83306ms step_avg:220.39ms step:379/6710 train_time:83525ms step_avg:220.38ms step:380/6710 train_time:83743ms step_avg:220.38ms step:381/6710 train_time:83965ms step_avg:220.38ms step:382/6710 train_time:84182ms step_avg:220.37ms step:383/6710 train_time:84401ms step_avg:220.37ms step:384/6710 train_time:84620ms step_avg:220.36ms step:385/6710 train_time:84840ms step_avg:220.36ms step:386/6710 train_time:85059ms step_avg:220.36ms step:387/6710 train_time:85279ms step_avg:220.36ms step:388/6710 train_time:85499ms step_avg:220.36ms step:389/6710 train_time:85718ms step_avg:220.36ms step:390/6710 train_time:85938ms step_avg:220.35ms step:391/6710 train_time:86158ms step_avg:220.35ms step:392/6710 train_time:86377ms step_avg:220.35ms step:393/6710 train_time:86598ms step_avg:220.35ms step:394/6710 train_time:86816ms step_avg:220.35ms step:395/6710 train_time:87037ms step_avg:220.35ms step:396/6710 train_time:87258ms step_avg:220.35ms step:397/6710 train_time:87476ms step_avg:220.34ms step:398/6710 train_time:87696ms step_avg:220.34ms step:399/6710 train_time:87916ms step_avg:220.34ms step:400/6710 train_time:88135ms step_avg:220.34ms step:401/6710 train_time:88355ms step_avg:220.34ms step:402/6710 train_time:88575ms step_avg:220.33ms step:403/6710 train_time:88795ms step_avg:220.33ms step:404/6710 train_time:89014ms step_avg:220.33ms step:405/6710 train_time:89235ms step_avg:220.33ms step:406/6710 train_time:89455ms step_avg:220.33ms step:407/6710 train_time:89674ms step_avg:220.33ms step:408/6710 train_time:89894ms step_avg:220.33ms step:409/6710 train_time:90114ms step_avg:220.33ms step:410/6710 train_time:90334ms step_avg:220.33ms step:411/6710 train_time:90554ms step_avg:220.33ms step:412/6710 train_time:90775ms step_avg:220.33ms step:413/6710 train_time:90994ms step_avg:220.32ms step:414/6710 train_time:91214ms step_avg:220.32ms step:415/6710 train_time:91434ms 
step_avg:220.32ms step:416/6710 train_time:91655ms step_avg:220.32ms step:417/6710 train_time:91874ms step_avg:220.32ms step:418/6710 train_time:92093ms step_avg:220.32ms step:419/6710 train_time:92314ms step_avg:220.32ms step:420/6710 train_time:92534ms step_avg:220.32ms step:421/6710 train_time:92755ms step_avg:220.32ms step:422/6710 train_time:92976ms step_avg:220.32ms step:423/6710 train_time:93195ms step_avg:220.32ms step:424/6710 train_time:93415ms step_avg:220.32ms step:425/6710 train_time:93635ms step_avg:220.32ms step:426/6710 train_time:93856ms step_avg:220.32ms step:427/6710 train_time:94075ms step_avg:220.32ms step:428/6710 train_time:94294ms step_avg:220.31ms step:429/6710 train_time:94514ms step_avg:220.31ms step:430/6710 train_time:94734ms step_avg:220.31ms step:431/6710 train_time:94955ms step_avg:220.31ms step:432/6710 train_time:95176ms step_avg:220.32ms step:433/6710 train_time:95396ms step_avg:220.31ms step:434/6710 train_time:95615ms step_avg:220.31ms step:435/6710 train_time:95835ms step_avg:220.31ms step:436/6710 train_time:96056ms step_avg:220.31ms step:437/6710 train_time:96276ms step_avg:220.31ms step:438/6710 train_time:96495ms step_avg:220.31ms step:439/6710 train_time:96715ms step_avg:220.31ms step:440/6710 train_time:96935ms step_avg:220.31ms step:441/6710 train_time:97155ms step_avg:220.31ms step:442/6710 train_time:97374ms step_avg:220.30ms step:443/6710 train_time:97595ms step_avg:220.30ms step:444/6710 train_time:97814ms step_avg:220.30ms step:445/6710 train_time:98035ms step_avg:220.30ms step:446/6710 train_time:98255ms step_avg:220.30ms step:447/6710 train_time:98474ms step_avg:220.30ms step:448/6710 train_time:98695ms step_avg:220.30ms step:449/6710 train_time:98913ms step_avg:220.30ms step:450/6710 train_time:99134ms step_avg:220.30ms step:451/6710 train_time:99354ms step_avg:220.30ms step:452/6710 train_time:99574ms step_avg:220.30ms step:453/6710 train_time:99793ms step_avg:220.29ms step:454/6710 train_time:100014ms 
step_avg:220.29ms step:455/6710 train_time:100235ms step_avg:220.30ms step:456/6710 train_time:100456ms step_avg:220.30ms step:457/6710 train_time:100676ms step_avg:220.30ms step:458/6710 train_time:100895ms step_avg:220.30ms step:459/6710 train_time:101115ms step_avg:220.29ms step:460/6710 train_time:101336ms step_avg:220.30ms step:461/6710 train_time:101556ms step_avg:220.30ms step:462/6710 train_time:101775ms step_avg:220.29ms step:463/6710 train_time:101994ms step_avg:220.29ms step:464/6710 train_time:102214ms step_avg:220.29ms step:465/6710 train_time:102435ms step_avg:220.29ms step:466/6710 train_time:102655ms step_avg:220.29ms step:467/6710 train_time:102877ms step_avg:220.29ms step:468/6710 train_time:103096ms step_avg:220.29ms step:469/6710 train_time:103314ms step_avg:220.29ms step:470/6710 train_time:103535ms step_avg:220.29ms step:471/6710 train_time:103756ms step_avg:220.29ms step:472/6710 train_time:103976ms step_avg:220.29ms step:473/6710 train_time:104195ms step_avg:220.29ms step:474/6710 train_time:104414ms step_avg:220.28ms step:475/6710 train_time:104636ms step_avg:220.29ms step:476/6710 train_time:104856ms step_avg:220.29ms step:477/6710 train_time:105077ms step_avg:220.29ms step:478/6710 train_time:105294ms step_avg:220.28ms step:479/6710 train_time:105512ms step_avg:220.28ms step:480/6710 train_time:105734ms step_avg:220.28ms step:481/6710 train_time:105955ms step_avg:220.28ms step:482/6710 train_time:106175ms step_avg:220.28ms step:483/6710 train_time:106393ms step_avg:220.28ms step:484/6710 train_time:106612ms step_avg:220.27ms step:485/6710 train_time:106834ms step_avg:220.28ms step:486/6710 train_time:107054ms step_avg:220.28ms step:487/6710 train_time:107274ms step_avg:220.28ms step:488/6710 train_time:107493ms step_avg:220.27ms step:489/6710 train_time:107712ms step_avg:220.27ms step:490/6710 train_time:107934ms step_avg:220.27ms step:491/6710 train_time:108154ms step_avg:220.27ms step:492/6710 train_time:108375ms step_avg:220.27ms 
step:493/6710 train_time:108594ms step_avg:220.27ms step:494/6710 train_time:108814ms step_avg:220.27ms step:495/6710 train_time:109037ms step_avg:220.28ms step:496/6710 train_time:109258ms step_avg:220.28ms step:497/6710 train_time:109476ms step_avg:220.27ms step:498/6710 train_time:109695ms step_avg:220.27ms step:499/6710 train_time:109914ms step_avg:220.27ms step:500/6710 train_time:110137ms step_avg:220.27ms step:500/6710 val_loss:3.873065 train_time:110312ms step_avg:220.62ms Parameter containing: tensor([1.0000, 1.0000, 0.7113, 1.0000, 0.5183, 1.0000, 0.7136, 1.0000], device='cuda:0', requires_grad=True) 0 [2.0288126468658447, 1.028812050819397] 1 [0.6784067749977112, 1.2298516035079956] 2 [0.79427570104599, 1.0405545234680176] 3 [0.619644820690155, 0.7392706274986267] 4 [0.6145538687705994, 0.7425358891487122] 5 [0.5804263353347778, 0.6234272718429565] 6 [0.6061234474182129, 0.8066515922546387] 7 [0.9029082655906677, 0.9406315684318542] 8 [0.3975716829299927, 0.8296146392822266] 9 [0.6899359226226807, 0.9969456195831299] 10 [0.7434765100479126, 1.0073788166046143] 11 [0.7932745218276978, 0.9839494228363037] 12 [0.8763079643249512, 0.9328910708427429] 13 [0.9294247031211853, 0.9061650633811951] 14 [0.9938780665397644, 1.104880690574646] 15 [1.0047916173934937, 1.0525201559066772] 0 [3.0353991985321045, 4.6062912940979, 4.877889633178711] 1 [6.951062202453613, 5.7469329833984375, 5.254223346710205] 2 [11.201369285583496, 5.362180709838867, 4.301965236663818] 3 [10.186087608337402, 3.822310209274292, 6.132099151611328] 4 [10.01717472076416, 3.2931861877441406, 5.195462226867676] 5 [8.781847953796387, 4.339366436004639, 5.827611923217773] 6 [9.331497192382812, 4.332347393035889, 4.895348072052002] 7 [13.582233428955078, 0.0, 8.788206100463867] 8 [7.842392921447754, 5.1465044021606445, 7.562027931213379] 9 [17.418155670166016, 4.592250823974609, 6.7301859855651855] 10 [22.010597229003906, 3.917954206466675, 5.963293552398682] 11 [28.209341049194336, 
2.797271251678467, 4.791940212249756] 12 [27.627361297607422, 3.510878086090088, 4.766870021820068] 13 [28.91014289855957, 7.272332668304443, 5.687243938446045] 14 [32.84548568725586, 7.786647796630859, 9.114116668701172] 15 [37.94533157348633, 9.570388793945312, 17.435897827148438] step:501/6710 train_time:110359ms step_avg:220.28ms step:502/6710 train_time:110576ms step_avg:220.27ms step:503/6710 train_time:110801ms step_avg:220.28ms step:504/6710 train_time:111021ms step_avg:220.28ms step:505/6710 train_time:111242ms step_avg:220.28ms step:506/6710 train_time:111465ms step_avg:220.29ms step:507/6710 train_time:111688ms step_avg:220.29ms step:508/6710 train_time:111910ms step_avg:220.30ms step:509/6710 train_time:112130ms step_avg:220.29ms step:510/6710 train_time:112352ms step_avg:220.30ms step:511/6710 train_time:112572ms step_avg:220.30ms step:512/6710 train_time:112793ms step_avg:220.30ms step:513/6710 train_time:113012ms step_avg:220.30ms step:514/6710 train_time:113232ms step_avg:220.30ms step:515/6710 train_time:113452ms step_avg:220.30ms step:516/6710 train_time:113673ms step_avg:220.30ms step:517/6710 train_time:113894ms step_avg:220.30ms step:518/6710 train_time:114113ms step_avg:220.30ms step:519/6710 train_time:114333ms step_avg:220.29ms step:520/6710 train_time:114554ms step_avg:220.30ms step:521/6710 train_time:114774ms step_avg:220.30ms step:522/6710 train_time:114995ms step_avg:220.30ms step:523/6710 train_time:115215ms step_avg:220.30ms step:524/6710 train_time:115436ms step_avg:220.30ms step:525/6710 train_time:115655ms step_avg:220.30ms step:526/6710 train_time:115876ms step_avg:220.30ms step:527/6710 train_time:116096ms step_avg:220.30ms step:528/6710 train_time:116316ms step_avg:220.30ms step:529/6710 train_time:116536ms step_avg:220.29ms step:530/6710 train_time:116756ms step_avg:220.29ms step:531/6710 train_time:116976ms step_avg:220.29ms step:532/6710 train_time:117196ms step_avg:220.29ms step:533/6710 train_time:117415ms step_avg:220.29ms 
step:534/6710 train_time:117634ms step_avg:220.29ms step:535/6710 train_time:117854ms step_avg:220.29ms step:536/6710 train_time:118074ms step_avg:220.29ms step:537/6710 train_time:118295ms step_avg:220.29ms step:538/6710 train_time:118515ms step_avg:220.29ms step:539/6710 train_time:118735ms step_avg:220.29ms step:540/6710 train_time:118955ms step_avg:220.29ms step:541/6710 train_time:119175ms step_avg:220.29ms step:542/6710 train_time:119396ms step_avg:220.29ms step:543/6710 train_time:119617ms step_avg:220.29ms step:544/6710 train_time:119838ms step_avg:220.29ms step:545/6710 train_time:120058ms step_avg:220.29ms step:546/6710 train_time:120276ms step_avg:220.29ms step:547/6710 train_time:120497ms step_avg:220.29ms step:548/6710 train_time:120716ms step_avg:220.29ms step:549/6710 train_time:120937ms step_avg:220.29ms step:550/6710 train_time:121159ms step_avg:220.29ms step:551/6710 train_time:121377ms step_avg:220.28ms step:552/6710 train_time:121596ms step_avg:220.28ms step:553/6710 train_time:121815ms step_avg:220.28ms step:554/6710 train_time:122036ms step_avg:220.28ms step:555/6710 train_time:122256ms step_avg:220.28ms step:556/6710 train_time:122477ms step_avg:220.28ms step:557/6710 train_time:122697ms step_avg:220.28ms step:558/6710 train_time:122916ms step_avg:220.28ms step:559/6710 train_time:123137ms step_avg:220.28ms step:560/6710 train_time:123356ms step_avg:220.28ms step:561/6710 train_time:123577ms step_avg:220.28ms step:562/6710 train_time:123797ms step_avg:220.28ms step:563/6710 train_time:124017ms step_avg:220.28ms step:564/6710 train_time:124238ms step_avg:220.28ms step:565/6710 train_time:124456ms step_avg:220.28ms step:566/6710 train_time:124676ms step_avg:220.28ms step:567/6710 train_time:124895ms step_avg:220.27ms step:568/6710 train_time:125116ms step_avg:220.27ms step:569/6710 train_time:125336ms step_avg:220.27ms step:570/6710 train_time:125557ms step_avg:220.28ms step:571/6710 train_time:125777ms step_avg:220.27ms step:572/6710 
train_time:125996ms step_avg:220.27ms step:573/6710 train_time:126216ms step_avg:220.27ms step:574/6710 train_time:126436ms step_avg:220.27ms step:575/6710 train_time:126658ms step_avg:220.27ms step:576/6710 train_time:126878ms step_avg:220.27ms step:577/6710 train_time:127098ms step_avg:220.27ms step:578/6710 train_time:127320ms step_avg:220.28ms step:579/6710 train_time:127538ms step_avg:220.27ms step:580/6710 train_time:127760ms step_avg:220.28ms step:581/6710 train_time:127981ms step_avg:220.28ms step:582/6710 train_time:128202ms step_avg:220.28ms step:583/6710 train_time:128422ms step_avg:220.28ms step:584/6710 train_time:128643ms step_avg:220.28ms step:585/6710 train_time:128863ms step_avg:220.28ms step:586/6710 train_time:129085ms step_avg:220.28ms step:587/6710 train_time:129305ms step_avg:220.28ms step:588/6710 train_time:129527ms step_avg:220.28ms step:589/6710 train_time:129747ms step_avg:220.28ms step:590/6710 train_time:129969ms step_avg:220.29ms step:591/6710 train_time:130189ms step_avg:220.29ms step:592/6710 train_time:130409ms step_avg:220.29ms step:593/6710 train_time:130628ms step_avg:220.28ms step:594/6710 train_time:130850ms step_avg:220.29ms step:595/6710 train_time:131071ms step_avg:220.29ms step:596/6710 train_time:131292ms step_avg:220.29ms step:597/6710 train_time:131511ms step_avg:220.29ms step:598/6710 train_time:131731ms step_avg:220.29ms step:599/6710 train_time:131952ms step_avg:220.29ms step:600/6710 train_time:132174ms step_avg:220.29ms step:601/6710 train_time:132394ms step_avg:220.29ms step:602/6710 train_time:132612ms step_avg:220.29ms step:603/6710 train_time:132832ms step_avg:220.29ms step:604/6710 train_time:133053ms step_avg:220.29ms step:605/6710 train_time:133274ms step_avg:220.29ms step:606/6710 train_time:133494ms step_avg:220.29ms step:607/6710 train_time:133713ms step_avg:220.28ms step:608/6710 train_time:133932ms step_avg:220.28ms step:609/6710 train_time:134153ms step_avg:220.28ms step:610/6710 train_time:134372ms 
step_avg:220.28ms step:611/6710 train_time:134593ms step_avg:220.28ms step:612/6710 train_time:134812ms step_avg:220.28ms step:613/6710 train_time:135032ms step_avg:220.28ms step:614/6710 train_time:135252ms step_avg:220.28ms step:615/6710 train_time:135473ms step_avg:220.28ms step:616/6710 train_time:135693ms step_avg:220.28ms step:617/6710 train_time:135913ms step_avg:220.28ms step:618/6710 train_time:136132ms step_avg:220.28ms step:619/6710 train_time:136352ms step_avg:220.28ms step:620/6710 train_time:136572ms step_avg:220.28ms step:621/6710 train_time:136792ms step_avg:220.28ms step:622/6710 train_time:137012ms step_avg:220.28ms step:623/6710 train_time:137230ms step_avg:220.27ms step:624/6710 train_time:137451ms step_avg:220.27ms step:625/6710 train_time:137673ms step_avg:220.28ms step:625/6710 val_loss:3.651807 train_time:137847ms step_avg:220.55ms Parameter containing: tensor([1.0000, 1.0000, 0.5666, 1.0000, 0.7126, 1.0000, 0.6800, 1.0000], device='cuda:0', requires_grad=True) 0 [2.4187841415405273, 1.4187828302383423] 1 [0.7300053834915161, 1.4948740005493164] 2 [0.8572203516960144, 1.2401516437530518] 3 [0.6112622022628784, 0.8075787425041199] 4 [0.3839254379272461, 0.8404847383499146] 5 [0.7873216867446899, 0.9445860981941223] 6 [0.6220324039459229, 1.0636365413665771] 7 [0.8857362866401672, 1.326012372970581] 8 [0.3843573033809662, 1.0210859775543213] 9 [0.6313794851303101, 1.2290536165237427] 10 [0.7004008889198303, 1.2285677194595337] 11 [0.6149006485939026, 1.1787700653076172] 12 [1.0288426876068115, 1.1528644561767578] 13 [1.019675850868225, 0.979577898979187] 14 [0.9123057723045349, 1.1443078517913818] 15 [0.7700795531272888, 1.0910873413085938] 0 [3.8146636486053467, 6.7999267578125, 6.83552885055542] 1 [10.181269645690918, 7.403770446777344, 9.505824089050293] 2 [17.746868133544922, 6.5530500411987305, 6.34629487991333] 3 [14.820780754089355, 5.108316898345947, 8.441255569458008] 4 [9.050389289855957, 5.778351783752441, 5.966814994812012] 5 
[12.926155090332031, 5.534231185913086, 8.322319030761719] 6 [13.556782722473145, 5.9115753173828125, 7.08458137512207] 7 [19.16498374938965, 0.0, 13.064538955688477] 8 [10.844491958618164, 7.066529750823975, 11.139749526977539] 9 [22.319284439086914, 5.899977684020996, 9.45158863067627] 10 [28.045522689819336, 4.618801593780518, 7.845963478088379] 11 [27.744182586669922, 6.239805221557617, 5.804182052612305] 12 [34.392486572265625, 4.665283679962158, 6.453570365905762] 13 [40.14847183227539, 6.674093723297119, 7.698970794677734] 14 [40.949344635009766, 6.954819202423096, 9.27429485321045] 15 [35.414424896240234, 15.019787788391113, 19.364063262939453] step:626/6710 train_time:137894ms step_avg:220.28ms step:627/6710 train_time:138143ms step_avg:220.32ms step:628/6710 train_time:138360ms step_avg:220.32ms step:629/6710 train_time:138577ms step_avg:220.31ms step:630/6710 train_time:138796ms step_avg:220.31ms step:631/6710 train_time:139022ms step_avg:220.32ms step:632/6710 train_time:139245ms step_avg:220.32ms step:633/6710 train_time:139464ms step_avg:220.32ms step:634/6710 train_time:139684ms step_avg:220.32ms step:635/6710 train_time:139905ms step_avg:220.32ms step:636/6710 train_time:140128ms step_avg:220.33ms step:637/6710 train_time:140349ms step_avg:220.33ms step:638/6710 train_time:140569ms step_avg:220.33ms step:639/6710 train_time:140788ms step_avg:220.33ms step:640/6710 train_time:141010ms step_avg:220.33ms step:641/6710 train_time:141231ms step_avg:220.33ms step:642/6710 train_time:141451ms step_avg:220.33ms step:643/6710 train_time:141670ms step_avg:220.33ms step:644/6710 train_time:141892ms step_avg:220.33ms step:645/6710 train_time:142112ms step_avg:220.33ms step:646/6710 train_time:142331ms step_avg:220.33ms step:647/6710 train_time:142551ms step_avg:220.33ms step:648/6710 train_time:142770ms step_avg:220.32ms step:649/6710 train_time:142991ms step_avg:220.33ms step:650/6710 train_time:143213ms step_avg:220.33ms step:651/6710 train_time:143431ms 
step_avg:220.32ms step:652/6710 train_time:143651ms step_avg:220.32ms step:653/6710 train_time:143872ms step_avg:220.32ms step:654/6710 train_time:144092ms step_avg:220.32ms step:655/6710 train_time:144314ms step_avg:220.33ms step:656/6710 train_time:144534ms step_avg:220.33ms step:657/6710 train_time:144754ms step_avg:220.33ms step:658/6710 train_time:144975ms step_avg:220.33ms step:659/6710 train_time:145195ms step_avg:220.33ms step:660/6710 train_time:145415ms step_avg:220.33ms step:661/6710 train_time:145634ms step_avg:220.32ms step:662/6710 train_time:145856ms step_avg:220.33ms step:663/6710 train_time:146076ms step_avg:220.33ms step:664/6710 train_time:146295ms step_avg:220.32ms step:665/6710 train_time:146515ms step_avg:220.32ms step:666/6710 train_time:146735ms step_avg:220.32ms step:667/6710 train_time:146957ms step_avg:220.32ms step:668/6710 train_time:147177ms step_avg:220.32ms step:669/6710 train_time:147397ms step_avg:220.32ms step:670/6710 train_time:147617ms step_avg:220.32ms step:671/6710 train_time:147839ms step_avg:220.33ms step:672/6710 train_time:148059ms step_avg:220.33ms step:673/6710 train_time:148280ms step_avg:220.33ms step:674/6710 train_time:148501ms step_avg:220.33ms step:675/6710 train_time:148720ms step_avg:220.33ms step:676/6710 train_time:148941ms step_avg:220.33ms step:677/6710 train_time:149161ms step_avg:220.33ms step:678/6710 train_time:149382ms step_avg:220.33ms step:679/6710 train_time:149601ms step_avg:220.33ms step:680/6710 train_time:149821ms step_avg:220.33ms step:681/6710 train_time:150044ms step_avg:220.33ms step:682/6710 train_time:150265ms step_avg:220.33ms step:683/6710 train_time:150486ms step_avg:220.33ms step:684/6710 train_time:150707ms step_avg:220.33ms step:685/6710 train_time:150928ms step_avg:220.33ms step:686/6710 train_time:151149ms step_avg:220.33ms step:687/6710 train_time:151371ms step_avg:220.34ms step:688/6710 train_time:151591ms step_avg:220.34ms step:689/6710 train_time:151812ms step_avg:220.34ms 
step:690/6710 train_time:152030ms step_avg:220.33ms step:691/6710 train_time:152251ms step_avg:220.33ms step:692/6710 train_time:152472ms step_avg:220.34ms step:693/6710 train_time:152693ms step_avg:220.34ms step:694/6710 train_time:152913ms step_avg:220.34ms step:695/6710 train_time:153132ms step_avg:220.33ms step:696/6710 train_time:153353ms step_avg:220.33ms step:697/6710 train_time:153573ms step_avg:220.33ms step:698/6710 train_time:153794ms step_avg:220.33ms step:699/6710 train_time:154014ms step_avg:220.33ms step:700/6710 train_time:154234ms step_avg:220.33ms step:701/6710 train_time:154455ms step_avg:220.34ms step:702/6710 train_time:154675ms step_avg:220.34ms step:703/6710 train_time:154894ms step_avg:220.33ms step:704/6710 train_time:155114ms step_avg:220.33ms step:705/6710 train_time:155334ms step_avg:220.33ms step:706/6710 train_time:155553ms step_avg:220.33ms step:707/6710 train_time:155774ms step_avg:220.33ms step:708/6710 train_time:155994ms step_avg:220.33ms step:709/6710 train_time:156214ms step_avg:220.33ms step:710/6710 train_time:156435ms step_avg:220.33ms step:711/6710 train_time:156654ms step_avg:220.33ms step:712/6710 train_time:156875ms step_avg:220.33ms step:713/6710 train_time:157095ms step_avg:220.33ms step:714/6710 train_time:157314ms step_avg:220.33ms step:715/6710 train_time:157535ms step_avg:220.33ms step:716/6710 train_time:157755ms step_avg:220.33ms step:717/6710 train_time:157976ms step_avg:220.33ms step:718/6710 train_time:158196ms step_avg:220.33ms step:719/6710 train_time:158416ms step_avg:220.33ms step:720/6710 train_time:158635ms step_avg:220.33ms step:721/6710 train_time:158855ms step_avg:220.33ms step:722/6710 train_time:159075ms step_avg:220.33ms step:723/6710 train_time:159295ms step_avg:220.33ms step:724/6710 train_time:159514ms step_avg:220.32ms step:725/6710 train_time:159734ms step_avg:220.32ms step:726/6710 train_time:159953ms step_avg:220.32ms step:727/6710 train_time:160173ms step_avg:220.32ms step:728/6710 
train_time:160393ms step_avg:220.32ms step:729/6710 train_time:160612ms step_avg:220.32ms step:730/6710 train_time:160832ms step_avg:220.32ms step:731/6710 train_time:161052ms step_avg:220.32ms step:732/6710 train_time:161273ms step_avg:220.32ms step:733/6710 train_time:161492ms step_avg:220.32ms step:734/6710 train_time:161712ms step_avg:220.32ms step:735/6710 train_time:161931ms step_avg:220.31ms step:736/6710 train_time:162152ms step_avg:220.31ms step:737/6710 train_time:162371ms step_avg:220.31ms step:738/6710 train_time:162591ms step_avg:220.31ms step:739/6710 train_time:162811ms step_avg:220.31ms step:740/6710 train_time:163032ms step_avg:220.31ms step:741/6710 train_time:163250ms step_avg:220.31ms step:742/6710 train_time:163471ms step_avg:220.31ms step:743/6710 train_time:163692ms step_avg:220.31ms step:744/6710 train_time:163911ms step_avg:220.31ms step:745/6710 train_time:164131ms step_avg:220.31ms step:746/6710 train_time:164351ms step_avg:220.31ms step:747/6710 train_time:164572ms step_avg:220.31ms step:748/6710 train_time:164793ms step_avg:220.31ms step:749/6710 train_time:165013ms step_avg:220.31ms step:750/6710 train_time:165232ms step_avg:220.31ms step:750/6710 val_loss:3.585537 train_time:165405ms step_avg:220.54ms Parameter containing: tensor([1.0000, 1.0000, 0.5101, 1.0000, 0.7461, 1.0000, 0.6613, 1.0000], device='cuda:0', requires_grad=True) 0 [2.74402117729187, 1.7440202236175537] 1 [0.7321416735649109, 1.7881397008895874] 2 [0.8935027122497559, 1.5015769004821777] 3 [0.634556233882904, 0.974392294883728] 4 [0.3414563834667206, 0.9555895924568176] 5 [0.8207606673240662, 1.193078875541687] 6 [0.6141409873962402, 1.2898716926574707] 7 [0.8875970244407654, 1.6856955289840698] 8 [0.3786681294441223, 1.1819489002227783] 9 [0.6099443435668945, 1.4382983446121216] 10 [0.6902723908424377, 1.4807024002075195] 11 [0.5588752627372742, 1.4488424062728882] 12 [1.0834388732910156, 1.5533193349838257] 13 [1.0536431074142456, 1.2588664293289185] 14 
[0.9251015186309814, 1.3580678701400757] 15 [0.7559914588928223, 1.2744431495666504] 0 [4.468076705932617, 8.512557983398438, 8.525074005126953] 1 [12.545405387878418, 9.030982971191406, 13.450519561767578] 2 [23.711811065673828, 7.985003471374512, 8.326971054077148] 3 [20.087820053100586, 6.910147190093994, 10.951772689819336] 4 [10.623772621154785, 7.527135372161865, 7.391313076019287] 5 [16.645523071289062, 7.030812740325928, 10.864591598510742] 6 [17.236602783203125, 7.618734359741211, 9.014126777648926] 7 [24.466917037963867, 0.0, 16.91230010986328] 8 [13.650659561157227, 9.089552879333496, 14.335888862609863] 9 [27.22168731689453, 7.5276103019714355, 11.798152923583984] 10 [34.47848129272461, 5.816084384918213, 9.856324195861816] 11 [30.767383575439453, 8.620660781860352, 6.832293510437012] 12 [41.99452209472656, 5.893966197967529, 8.113080024719238] 13 [51.159427642822266, 8.08980655670166, 10.099381446838379] 14 [52.91672134399414, 8.622786521911621, 12.534141540527344] 15 [44.81407165527344, 20.462223052978516, 27.468997955322266] step:751/6710 train_time:165452ms step_avg:220.31ms step:752/6710 train_time:165670ms step_avg:220.31ms step:753/6710 train_time:165895ms step_avg:220.31ms step:754/6710 train_time:166115ms step_avg:220.31ms step:755/6710 train_time:166333ms step_avg:220.31ms step:756/6710 train_time:166556ms step_avg:220.31ms step:757/6710 train_time:166775ms step_avg:220.31ms step:758/6710 train_time:166998ms step_avg:220.31ms step:759/6710 train_time:167218ms step_avg:220.31ms step:760/6710 train_time:167438ms step_avg:220.31ms step:761/6710 train_time:167657ms step_avg:220.31ms step:762/6710 train_time:167877ms step_avg:220.31ms step:763/6710 train_time:168098ms step_avg:220.31ms step:764/6710 train_time:168317ms step_avg:220.31ms step:765/6710 train_time:168536ms step_avg:220.31ms step:766/6710 train_time:168758ms step_avg:220.31ms step:767/6710 train_time:168979ms step_avg:220.31ms step:768/6710 train_time:169199ms step_avg:220.31ms 
step:769/6710 train_time:169419ms step_avg:220.31ms step:770/6710 train_time:169637ms step_avg:220.31ms step:771/6710 train_time:169857ms step_avg:220.31ms step:772/6710 train_time:170078ms step_avg:220.31ms step:773/6710 train_time:170299ms step_avg:220.31ms step:774/6710 train_time:170516ms step_avg:220.30ms step:775/6710 train_time:170735ms step_avg:220.30ms step:776/6710 train_time:170956ms step_avg:220.30ms step:777/6710 train_time:171178ms step_avg:220.31ms step:778/6710 train_time:171398ms step_avg:220.31ms step:779/6710 train_time:171617ms step_avg:220.30ms step:780/6710 train_time:171837ms step_avg:220.30ms step:781/6710 train_time:172057ms step_avg:220.30ms step:782/6710 train_time:172279ms step_avg:220.31ms step:783/6710 train_time:172498ms step_avg:220.30ms step:784/6710 train_time:172719ms step_avg:220.30ms step:785/6710 train_time:172938ms step_avg:220.30ms step:786/6710 train_time:173159ms step_avg:220.30ms step:787/6710 train_time:173379ms step_avg:220.30ms step:788/6710 train_time:173599ms step_avg:220.30ms step:789/6710 train_time:173819ms step_avg:220.30ms step:790/6710 train_time:174038ms step_avg:220.30ms step:791/6710 train_time:174257ms step_avg:220.30ms step:792/6710 train_time:174477ms step_avg:220.30ms step:793/6710 train_time:174697ms step_avg:220.30ms step:794/6710 train_time:174917ms step_avg:220.30ms step:795/6710 train_time:175136ms step_avg:220.30ms step:796/6710 train_time:175356ms step_avg:220.30ms step:797/6710 train_time:175577ms step_avg:220.30ms step:798/6710 train_time:175797ms step_avg:220.30ms step:799/6710 train_time:176016ms step_avg:220.30ms step:800/6710 train_time:176236ms step_avg:220.29ms step:801/6710 train_time:176459ms step_avg:220.30ms step:802/6710 train_time:176678ms step_avg:220.30ms step:803/6710 train_time:176898ms step_avg:220.30ms step:804/6710 train_time:177117ms step_avg:220.29ms step:805/6710 train_time:177336ms step_avg:220.29ms step:806/6710 train_time:177557ms step_avg:220.29ms step:807/6710 
train_time:177779ms step_avg:220.30ms step:808/6710 train_time:177998ms step_avg:220.29ms step:809/6710 train_time:178217ms step_avg:220.29ms step:810/6710 train_time:178437ms step_avg:220.29ms step:811/6710 train_time:178657ms step_avg:220.29ms step:812/6710 train_time:178877ms step_avg:220.29ms step:813/6710 train_time:179096ms step_avg:220.29ms step:814/6710 train_time:179315ms step_avg:220.29ms step:815/6710 train_time:179535ms step_avg:220.29ms step:816/6710 train_time:179757ms step_avg:220.29ms step:817/6710 train_time:179977ms step_avg:220.29ms step:818/6710 train_time:180196ms step_avg:220.29ms step:819/6710 train_time:180417ms step_avg:220.29ms step:820/6710 train_time:180638ms step_avg:220.29ms step:821/6710 train_time:180857ms step_avg:220.29ms step:822/6710 train_time:181077ms step_avg:220.29ms step:823/6710 train_time:181297ms step_avg:220.29ms step:824/6710 train_time:181518ms step_avg:220.29ms step:825/6710 train_time:181737ms step_avg:220.29ms step:826/6710 train_time:181957ms step_avg:220.29ms step:827/6710 train_time:182178ms step_avg:220.29ms step:828/6710 train_time:182397ms step_avg:220.29ms step:829/6710 train_time:182617ms step_avg:220.29ms step:830/6710 train_time:182836ms step_avg:220.28ms step:831/6710 train_time:183056ms step_avg:220.28ms step:832/6710 train_time:183276ms step_avg:220.28ms step:833/6710 train_time:183497ms step_avg:220.28ms step:834/6710 train_time:183716ms step_avg:220.28ms step:835/6710 train_time:183936ms step_avg:220.28ms step:836/6710 train_time:184155ms step_avg:220.28ms step:837/6710 train_time:184377ms step_avg:220.28ms step:838/6710 train_time:184597ms step_avg:220.28ms step:839/6710 train_time:184816ms step_avg:220.28ms step:840/6710 train_time:185036ms step_avg:220.28ms step:841/6710 train_time:185256ms step_avg:220.28ms step:842/6710 train_time:185477ms step_avg:220.28ms step:843/6710 train_time:185698ms step_avg:220.28ms step:844/6710 train_time:185916ms step_avg:220.28ms step:845/6710 train_time:186136ms 
step_avg:220.28ms step:846/6710 train_time:186356ms step_avg:220.28ms step:847/6710 train_time:186576ms step_avg:220.28ms step:848/6710 train_time:186796ms step_avg:220.28ms step:849/6710 train_time:187015ms step_avg:220.28ms step:850/6710 train_time:187234ms step_avg:220.28ms step:851/6710 train_time:187456ms step_avg:220.28ms step:852/6710 train_time:187676ms step_avg:220.28ms step:853/6710 train_time:187897ms step_avg:220.28ms step:854/6710 train_time:188116ms step_avg:220.28ms step:855/6710 train_time:188335ms step_avg:220.28ms step:856/6710 train_time:188557ms step_avg:220.28ms step:857/6710 train_time:188779ms step_avg:220.28ms step:858/6710 train_time:188997ms step_avg:220.28ms step:859/6710 train_time:189216ms step_avg:220.27ms step:860/6710 train_time:189435ms step_avg:220.27ms step:861/6710 train_time:189655ms step_avg:220.27ms step:862/6710 train_time:189877ms step_avg:220.27ms step:863/6710 train_time:190097ms step_avg:220.27ms step:864/6710 train_time:190315ms step_avg:220.27ms step:865/6710 train_time:190536ms step_avg:220.27ms step:866/6710 train_time:190756ms step_avg:220.27ms step:867/6710 train_time:190977ms step_avg:220.27ms step:868/6710 train_time:191196ms step_avg:220.27ms step:869/6710 train_time:191415ms step_avg:220.27ms step:870/6710 train_time:191636ms step_avg:220.27ms step:871/6710 train_time:191856ms step_avg:220.27ms step:872/6710 train_time:192077ms step_avg:220.27ms step:873/6710 train_time:192297ms step_avg:220.27ms step:874/6710 train_time:192516ms step_avg:220.27ms step:875/6710 train_time:192736ms step_avg:220.27ms step:875/6710 val_loss:3.535389 train_time:192909ms step_avg:220.47ms Parameter containing: tensor([1.0000, 1.0000, 0.4717, 1.0000, 0.7641, 1.0000, 0.6427, 1.0000], device='cuda:0', requires_grad=True) 0 [3.0877749919891357, 2.0877721309661865] 1 [0.7280318737030029, 2.078738212585449] 2 [0.9031692147254944, 1.7426633834838867] 3 [0.6408694386482239, 1.159558892250061] 4 [0.31936150789260864, 1.0705962181091309] 5 
[0.8483643531799316, 1.4686551094055176] 6 [0.5950151681900024, 1.5403730869293213] 7 [0.8775723576545715, 2.0643608570098877] 8 [0.38042691349983215, 1.28813636302948] 9 [0.5923682451248169, 1.5922040939331055] 10 [0.6780117154121399, 1.6629388332366943] 11 [0.5163789391517639, 1.663699746131897] 12 [1.1210215091705322, 1.9427032470703125] 13 [1.0796536207199097, 1.5177631378173828] 14 [0.9375514984130859, 1.552903413772583] 15 [0.7524945735931396, 1.463065505027771] 0 [5.154561996459961, 10.233156204223633, 9.833720207214355] 1 [14.646698951721191, 10.51347541809082, 16.311628341674805] 2 [28.275840759277344, 9.477932929992676, 10.593863487243652] 3 [24.418088912963867, 8.77369213104248, 13.604957580566406] 4 [12.16740894317627, 9.316473007202148, 8.696927070617676] 5 [20.319721221923828, 8.489212989807129, 13.14514446258545] 6 [20.273704528808594, 9.319299697875977, 10.925457000732422] 7 [28.87085723876953, 0.0, 20.29808235168457] 8 [16.206335067749023, 11.15263557434082, 17.35682487487793] 9 [31.322702407836914, 9.125078201293945, 14.021162986755371] 10 [39.84978485107422, 7.03800106048584, 11.889792442321777] 11 [32.865928649902344, 10.841344833374023, 7.74107551574707] 12 [48.312408447265625, 7.144101619720459, 9.713178634643555] 13 [60.91452407836914, 9.521580696105957, 12.49880599975586] 14 [64.06417083740234, 10.492066383361816, 16.02152442932129] 15 [54.34141159057617, 25.53639793395996, 34.353660583496094] step:876/6710 train_time:192957ms step_avg:220.27ms step:877/6710 train_time:193173ms step_avg:220.27ms step:878/6710 train_time:193399ms step_avg:220.27ms step:879/6710 train_time:193618ms step_avg:220.27ms step:880/6710 train_time:193836ms step_avg:220.27ms step:881/6710 train_time:194057ms step_avg:220.27ms step:882/6710 train_time:194278ms step_avg:220.27ms step:883/6710 train_time:194500ms step_avg:220.27ms step:884/6710 train_time:194719ms step_avg:220.27ms step:885/6710 train_time:194941ms step_avg:220.27ms step:886/6710 train_time:195160ms 
step_avg:220.27ms step:887/6710 train_time:195383ms step_avg:220.27ms step:888/6710 train_time:195604ms step_avg:220.28ms step:889/6710 train_time:195825ms step_avg:220.28ms step:890/6710 train_time:196045ms step_avg:220.28ms step:891/6710 train_time:196266ms step_avg:220.28ms step:892/6710 train_time:196488ms step_avg:220.28ms step:893/6710 train_time:196708ms step_avg:220.28ms step:894/6710 train_time:196928ms step_avg:220.28ms step:895/6710 train_time:197149ms step_avg:220.28ms step:896/6710 train_time:197371ms step_avg:220.28ms step:897/6710 train_time:197590ms step_avg:220.28ms step:898/6710 train_time:197810ms step_avg:220.28ms step:899/6710 train_time:198029ms step_avg:220.28ms step:900/6710 train_time:198250ms step_avg:220.28ms step:901/6710 train_time:198471ms step_avg:220.28ms step:902/6710 train_time:198691ms step_avg:220.28ms step:903/6710 train_time:198909ms step_avg:220.28ms step:904/6710 train_time:199129ms step_avg:220.28ms step:905/6710 train_time:199349ms step_avg:220.27ms step:906/6710 train_time:199570ms step_avg:220.28ms step:907/6710 train_time:199792ms step_avg:220.28ms step:908/6710 train_time:200012ms step_avg:220.28ms step:909/6710 train_time:200230ms step_avg:220.28ms step:910/6710 train_time:200451ms step_avg:220.28ms step:911/6710 train_time:200671ms step_avg:220.28ms step:912/6710 train_time:200890ms step_avg:220.27ms step:913/6710 train_time:201110ms step_avg:220.27ms step:914/6710 train_time:201331ms step_avg:220.27ms step:915/6710 train_time:201551ms step_avg:220.27ms step:916/6710 train_time:201771ms step_avg:220.27ms step:917/6710 train_time:201990ms step_avg:220.27ms step:918/6710 train_time:202210ms step_avg:220.27ms step:919/6710 train_time:202430ms step_avg:220.27ms step:920/6710 train_time:202649ms step_avg:220.27ms step:921/6710 train_time:202870ms step_avg:220.27ms step:922/6710 train_time:203090ms step_avg:220.27ms step:923/6710 train_time:203311ms step_avg:220.27ms step:924/6710 train_time:203530ms step_avg:220.27ms 
step:925/6710 train_time:203749ms step_avg:220.27ms step:926/6710 train_time:203970ms step_avg:220.27ms step:927/6710 train_time:204191ms step_avg:220.27ms step:928/6710 train_time:204412ms step_avg:220.27ms step:929/6710 train_time:204631ms step_avg:220.27ms step:930/6710 train_time:204849ms step_avg:220.27ms step:931/6710 train_time:205071ms step_avg:220.27ms step:932/6710 train_time:205292ms step_avg:220.27ms step:933/6710 train_time:205512ms step_avg:220.27ms step:934/6710 train_time:205731ms step_avg:220.27ms step:935/6710 train_time:205951ms step_avg:220.27ms step:936/6710 train_time:206171ms step_avg:220.27ms step:937/6710 train_time:206392ms step_avg:220.27ms step:938/6710 train_time:206610ms step_avg:220.27ms step:939/6710 train_time:206831ms step_avg:220.27ms step:940/6710 train_time:207051ms step_avg:220.27ms step:941/6710 train_time:207271ms step_avg:220.27ms step:942/6710 train_time:207491ms step_avg:220.27ms step:943/6710 train_time:207710ms step_avg:220.26ms step:944/6710 train_time:207928ms step_avg:220.26ms step:945/6710 train_time:208149ms step_avg:220.26ms step:946/6710 train_time:208370ms step_avg:220.26ms step:947/6710 train_time:208590ms step_avg:220.26ms step:948/6710 train_time:208811ms step_avg:220.26ms step:949/6710 train_time:209030ms step_avg:220.26ms step:950/6710 train_time:209251ms step_avg:220.26ms step:951/6710 train_time:209471ms step_avg:220.26ms step:952/6710 train_time:209691ms step_avg:220.26ms step:953/6710 train_time:209911ms step_avg:220.26ms step:954/6710 train_time:210131ms step_avg:220.26ms step:955/6710 train_time:210351ms step_avg:220.26ms step:956/6710 train_time:210570ms step_avg:220.26ms step:957/6710 train_time:210791ms step_avg:220.26ms step:958/6710 train_time:211011ms step_avg:220.26ms step:959/6710 train_time:211231ms step_avg:220.26ms step:960/6710 train_time:211450ms step_avg:220.26ms step:961/6710 train_time:211670ms step_avg:220.26ms step:962/6710 train_time:211890ms step_avg:220.26ms step:963/6710 
train_time:212109ms step_avg:220.26ms step:964/6710 train_time:212330ms step_avg:220.26ms step:965/6710 train_time:212549ms step_avg:220.26ms step:966/6710 train_time:212769ms step_avg:220.26ms step:967/6710 train_time:212989ms step_avg:220.26ms step:968/6710 train_time:213209ms step_avg:220.26ms step:969/6710 train_time:213430ms step_avg:220.26ms step:970/6710 train_time:213650ms step_avg:220.26ms step:971/6710 train_time:213872ms step_avg:220.26ms step:972/6710 train_time:214091ms step_avg:220.26ms step:973/6710 train_time:214310ms step_avg:220.26ms step:974/6710 train_time:214529ms step_avg:220.26ms step:975/6710 train_time:214747ms step_avg:220.25ms step:976/6710 train_time:214970ms step_avg:220.26ms step:977/6710 train_time:215190ms step_avg:220.26ms step:978/6710 train_time:215411ms step_avg:220.26ms step:979/6710 train_time:215630ms step_avg:220.26ms step:980/6710 train_time:215849ms step_avg:220.25ms step:981/6710 train_time:216069ms step_avg:220.25ms step:982/6710 train_time:216290ms step_avg:220.25ms step:983/6710 train_time:216510ms step_avg:220.25ms step:984/6710 train_time:216730ms step_avg:220.25ms step:985/6710 train_time:216950ms step_avg:220.25ms step:986/6710 train_time:217170ms step_avg:220.25ms step:987/6710 train_time:217390ms step_avg:220.25ms step:988/6710 train_time:217610ms step_avg:220.25ms step:989/6710 train_time:217829ms step_avg:220.25ms step:990/6710 train_time:218049ms step_avg:220.25ms step:991/6710 train_time:218271ms step_avg:220.25ms step:992/6710 train_time:218491ms step_avg:220.25ms step:993/6710 train_time:218711ms step_avg:220.25ms step:994/6710 train_time:218931ms step_avg:220.25ms step:995/6710 train_time:219150ms step_avg:220.25ms step:996/6710 train_time:219370ms step_avg:220.25ms step:997/6710 train_time:219591ms step_avg:220.25ms step:998/6710 train_time:219812ms step_avg:220.25ms step:999/6710 train_time:220032ms step_avg:220.25ms step:1000/6710 train_time:220253ms step_avg:220.25ms step:1000/6710 val_loss:3.462700 
train_time:220426ms step_avg:220.43ms Parameter containing: tensor([1.0000, 1.0000, 0.4477, 1.0000, 0.7790, 1.0000, 0.6341, 1.0000], device='cuda:0', requires_grad=True) 0 [3.388371229171753, 2.3883683681488037] 1 [0.7356235980987549, 2.363144636154175] 2 [0.9252156019210815, 1.9829986095428467] 3 [0.6399906873703003, 1.3692413568496704] 4 [0.2958710193634033, 1.2087140083312988] 5 [0.8730360865592957, 1.715943694114685] 6 [0.6021972298622131, 1.7210946083068848] 7 [0.8678487539291382, 2.42122745513916] 8 [0.38422638177871704, 1.3970167636871338] 9 [0.5758576393127441, 1.7378829717636108] 10 [0.670581042766571, 1.820213794708252] 11 [0.47821134328842163, 1.8316781520843506] 12 [1.1447323560714722, 2.3064582347869873] 13 [1.0925027132034302, 1.7550370693206787] 14 [0.9428306818008423, 1.7178595066070557] 15 [0.7474075555801392, 1.6087706089019775] 0 [5.758079528808594, 11.713626861572266, 11.19619369506836] 1 [16.788022994995117, 12.09055233001709, 20.639055252075195] 2 [34.3189811706543, 10.730297088623047, 12.49694538116455] 3 [29.101146697998047, 10.668548583984375, 15.755914688110352] 4 [13.33530330657959, 10.87753963470459, 10.014774322509766] 5 [23.714054107666016, 9.809249877929688, 15.350424766540527] 6 [23.755123138427734, 11.091100692749023, 12.641606330871582] 7 [33.41707992553711, 0.0, 23.113792419433594] 8 [18.791845321655273, 12.969682693481445, 19.974586486816406] 9 [35.20585632324219, 10.692063331604004, 16.197328567504883] 10 [45.02701950073242, 8.297921180725098, 13.758855819702148] 11 [34.608741760253906, 12.877859115600586, 8.137834548950195] 12 [53.573116302490234, 8.337746620178223, 10.600318908691406] 13 [68.56715393066406, 10.303685188293457, 14.112192153930664] 14 [72.38459014892578, 11.76253890991211, 19.33110809326172] 15 [61.02833557128906, 32.001956939697266, 40.90986633300781] step:1001/6710 train_time:220475ms step_avg:220.25ms step:1002/6710 train_time:220690ms step_avg:220.25ms step:1003/6710 train_time:220914ms step_avg:220.25ms 
step:1004/6710 train_time:221136ms step_avg:220.25ms step:1005/6710 train_time:221356ms step_avg:220.25ms step:1006/6710 train_time:221580ms step_avg:220.26ms step:1007/6710 train_time:221800ms step_avg:220.26ms step:1008/6710 train_time:222022ms step_avg:220.26ms step:1009/6710 train_time:222243ms step_avg:220.26ms step:1010/6710 train_time:222466ms step_avg:220.26ms step:1011/6710 train_time:222689ms step_avg:220.27ms step:1012/6710 train_time:222911ms step_avg:220.27ms step:1013/6710 train_time:223133ms step_avg:220.27ms step:1014/6710 train_time:223354ms step_avg:220.27ms step:1015/6710 train_time:223577ms step_avg:220.27ms step:1016/6710 train_time:223798ms step_avg:220.27ms step:1017/6710 train_time:224019ms step_avg:220.27ms step:1018/6710 train_time:224239ms step_avg:220.27ms step:1019/6710 train_time:224460ms step_avg:220.27ms step:1020/6710 train_time:224682ms step_avg:220.28ms step:1021/6710 train_time:224903ms step_avg:220.28ms step:1022/6710 train_time:225124ms step_avg:220.28ms step:1023/6710 train_time:225345ms step_avg:220.28ms step:1024/6710 train_time:225568ms step_avg:220.28ms step:1025/6710 train_time:225790ms step_avg:220.28ms step:1026/6710 train_time:226012ms step_avg:220.28ms step:1027/6710 train_time:226232ms step_avg:220.28ms step:1028/6710 train_time:226455ms step_avg:220.29ms step:1029/6710 train_time:226676ms step_avg:220.29ms step:1030/6710 train_time:226896ms step_avg:220.29ms step:1031/6710 train_time:227117ms step_avg:220.29ms step:1032/6710 train_time:227338ms step_avg:220.29ms step:1033/6710 train_time:227557ms step_avg:220.29ms step:1034/6710 train_time:227777ms step_avg:220.29ms step:1035/6710 train_time:227998ms step_avg:220.29ms step:1036/6710 train_time:228218ms step_avg:220.29ms step:1037/6710 train_time:228439ms step_avg:220.29ms step:1038/6710 train_time:228662ms step_avg:220.29ms step:1039/6710 train_time:228884ms step_avg:220.29ms step:1040/6710 train_time:229106ms step_avg:220.29ms step:1041/6710 train_time:229328ms 
step_avg:220.30ms step:1042/6710 train_time:229550ms step_avg:220.30ms step:1043/6710 train_time:229772ms step_avg:220.30ms step:1044/6710 train_time:229994ms step_avg:220.30ms step:1045/6710 train_time:230216ms step_avg:220.30ms step:1046/6710 train_time:230438ms step_avg:220.30ms step:1047/6710 train_time:230658ms step_avg:220.30ms step:1048/6710 train_time:230879ms step_avg:220.30ms step:1049/6710 train_time:231099ms step_avg:220.30ms step:1050/6710 train_time:231320ms step_avg:220.30ms step:1051/6710 train_time:231541ms step_avg:220.31ms step:1052/6710 train_time:231761ms step_avg:220.31ms step:1053/6710 train_time:231982ms step_avg:220.31ms step:1054/6710 train_time:232204ms step_avg:220.31ms step:1055/6710 train_time:232428ms step_avg:220.31ms step:1056/6710 train_time:232650ms step_avg:220.31ms step:1057/6710 train_time:232871ms step_avg:220.31ms step:1058/6710 train_time:233092ms step_avg:220.31ms step:1059/6710 train_time:233313ms step_avg:220.31ms step:1060/6710 train_time:233534ms step_avg:220.32ms step:1061/6710 train_time:233756ms step_avg:220.32ms step:1062/6710 train_time:233976ms step_avg:220.32ms step:1063/6710 train_time:234197ms step_avg:220.32ms step:1064/6710 train_time:234418ms step_avg:220.32ms step:1065/6710 train_time:234637ms step_avg:220.32ms step:1066/6710 train_time:234857ms step_avg:220.32ms step:1067/6710 train_time:235078ms step_avg:220.32ms step:1068/6710 train_time:235298ms step_avg:220.32ms step:1069/6710 train_time:235518ms step_avg:220.32ms step:1070/6710 train_time:235739ms step_avg:220.32ms step:1071/6710 train_time:235959ms step_avg:220.32ms step:1072/6710 train_time:236180ms step_avg:220.32ms step:1073/6710 train_time:236400ms step_avg:220.32ms step:1074/6710 train_time:236622ms step_avg:220.32ms step:1075/6710 train_time:236843ms step_avg:220.32ms step:1076/6710 train_time:237065ms step_avg:220.32ms step:1077/6710 train_time:237286ms step_avg:220.32ms step:1078/6710 train_time:237508ms step_avg:220.32ms step:1079/6710 
train_time:237729ms step_avg:220.32ms step:1080/6710 train_time:237951ms step_avg:220.33ms step:1081/6710 train_time:238173ms step_avg:220.33ms step:1082/6710 train_time:238396ms step_avg:220.33ms step:1083/6710 train_time:238616ms step_avg:220.33ms step:1084/6710 train_time:238837ms step_avg:220.33ms step:1085/6710 train_time:239057ms step_avg:220.33ms step:1086/6710 train_time:239278ms step_avg:220.33ms step:1087/6710 train_time:239499ms step_avg:220.33ms step:1088/6710 train_time:239719ms step_avg:220.33ms step:1089/6710 train_time:239939ms step_avg:220.33ms step:1090/6710 train_time:240160ms step_avg:220.33ms step:1091/6710 train_time:240381ms step_avg:220.33ms step:1092/6710 train_time:240602ms step_avg:220.33ms step:1093/6710 train_time:240824ms step_avg:220.33ms step:1094/6710 train_time:241046ms step_avg:220.33ms step:1095/6710 train_time:241269ms step_avg:220.34ms step:1096/6710 train_time:241492ms step_avg:220.34ms step:1097/6710 train_time:241713ms step_avg:220.34ms step:1098/6710 train_time:241935ms step_avg:220.34ms step:1099/6710 train_time:242155ms step_avg:220.34ms step:1100/6710 train_time:242377ms step_avg:220.34ms step:1101/6710 train_time:242598ms step_avg:220.34ms step:1102/6710 train_time:242819ms step_avg:220.34ms step:1103/6710 train_time:243040ms step_avg:220.34ms step:1104/6710 train_time:243260ms step_avg:220.34ms step:1105/6710 train_time:243481ms step_avg:220.34ms step:1106/6710 train_time:243700ms step_avg:220.34ms step:1107/6710 train_time:243921ms step_avg:220.34ms step:1108/6710 train_time:244143ms step_avg:220.35ms step:1109/6710 train_time:244363ms step_avg:220.35ms step:1110/6710 train_time:244584ms step_avg:220.35ms step:1111/6710 train_time:244807ms step_avg:220.35ms step:1112/6710 train_time:245028ms step_avg:220.35ms step:1113/6710 train_time:245251ms step_avg:220.35ms step:1114/6710 train_time:245473ms step_avg:220.35ms step:1115/6710 train_time:245694ms step_avg:220.35ms step:1116/6710 train_time:245916ms step_avg:220.35ms 
step:1117/6710 train_time:246136ms step_avg:220.35ms step:1118/6710 train_time:246358ms step_avg:220.36ms step:1119/6710 train_time:246580ms step_avg:220.36ms step:1120/6710 train_time:246801ms step_avg:220.36ms step:1121/6710 train_time:247023ms step_avg:220.36ms step:1122/6710 train_time:247245ms step_avg:220.36ms step:1123/6710 train_time:247466ms step_avg:220.36ms step:1124/6710 train_time:247688ms step_avg:220.36ms step:1125/6710 train_time:247910ms step_avg:220.36ms step:1125/6710 val_loss:3.429494 train_time:248085ms step_avg:220.52ms Parameter containing: tensor([1.0000, 1.0000, 0.4301, 1.0000, 0.7853, 1.0000, 0.6160, 1.0000], device='cuda:0', requires_grad=True) 0 [3.6870951652526855, 2.6870923042297363] 1 [0.7209855914115906, 2.6304123401641846] 2 [0.9220405220985413, 2.2020936012268066] 3 [0.6416423916816711, 1.5429353713989258] 4 [0.28592613339424133, 1.291837453842163] 5 [0.8950182795524597, 1.9364265203475952] 6 [0.5908427238464355, 1.9124475717544556] 7 [0.8606324195861816, 2.7105729579925537] 8 [0.3846510648727417, 1.470832347869873] 9 [0.5650331974029541, 1.8678531646728516] 10 [0.6675003170967102, 1.9479281902313232] 11 [0.4546341300010681, 1.941491723060608] 12 [1.1693615913391113, 2.626675844192505] 13 [1.1000384092330933, 1.9029452800750732] 14 [0.9426565170288086, 1.7541658878326416] 15 [0.7282420992851257, 1.630362868309021] 0 [6.355682849884033, 13.126569747924805, 12.828007698059082] 1 [18.561023712158203, 13.272320747375488, 26.93839454650879] 2 [40.35435485839844, 12.152326583862305, 15.025140762329102] 3 [34.0111083984375, 12.487444877624512, 17.97410774230957] 4 [14.857300758361816, 12.655858993530273, 10.948958396911621] 5 [27.254329681396484, 11.04543685913086, 17.625843048095703] 6 [26.61054229736328, 12.629556655883789, 14.586552619934082] 7 [37.40536880493164, 0.0, 26.336605072021484] 8 [21.107723236083984, 14.698806762695312, 23.761802673339844] 9 [38.91875457763672, 11.994935989379883, 18.84333610534668] 10 [50.08892822265625, 
9.40845775604248, 16.121721267700195] 11 [36.75440216064453, 14.91235065460205, 9.361502647399902] 12 [59.721954345703125, 9.59050464630127, 12.488187789916992] 13 [77.66492462158203, 11.276927947998047, 16.602134704589844] 14 [82.24966430664062, 12.882467269897461, 21.947715759277344] 15 [67.8804931640625, 36.285003662109375, 47.32188415527344] step:1126/6710 train_time:248133ms step_avg:220.37ms step:1127/6710 train_time:248350ms step_avg:220.36ms step:1128/6710 train_time:248578ms step_avg:220.37ms step:1129/6710 train_time:248797ms step_avg:220.37ms step:1130/6710 train_time:249018ms step_avg:220.37ms step:1131/6710 train_time:249241ms step_avg:220.37ms step:1132/6710 train_time:249462ms step_avg:220.37ms step:1133/6710 train_time:249685ms step_avg:220.38ms step:1134/6710 train_time:249906ms step_avg:220.38ms step:1135/6710 train_time:250128ms step_avg:220.38ms step:1136/6710 train_time:250351ms step_avg:220.38ms step:1137/6710 train_time:250574ms step_avg:220.38ms step:1138/6710 train_time:250796ms step_avg:220.38ms step:1139/6710 train_time:251018ms step_avg:220.38ms step:1140/6710 train_time:251238ms step_avg:220.38ms step:1141/6710 train_time:251458ms step_avg:220.38ms step:1142/6710 train_time:251680ms step_avg:220.39ms step:1143/6710 train_time:251900ms step_avg:220.39ms step:1144/6710 train_time:252121ms step_avg:220.39ms step:1145/6710 train_time:252341ms step_avg:220.39ms step:1146/6710 train_time:252563ms step_avg:220.39ms step:1147/6710 train_time:252783ms step_avg:220.39ms step:1148/6710 train_time:253006ms step_avg:220.39ms step:1149/6710 train_time:253227ms step_avg:220.39ms step:1150/6710 train_time:253448ms step_avg:220.39ms step:1151/6710 train_time:253671ms step_avg:220.39ms step:1152/6710 train_time:253893ms step_avg:220.39ms step:1153/6710 train_time:254114ms step_avg:220.39ms step:1154/6710 train_time:254336ms step_avg:220.39ms step:1155/6710 train_time:254558ms step_avg:220.40ms step:1156/6710 train_time:254780ms step_avg:220.40ms 
step:1157/6710 train_time:255002ms step_avg:220.40ms step:1158/6710 train_time:255223ms step_avg:220.40ms step:1159/6710 train_time:255442ms step_avg:220.40ms step:1160/6710 train_time:255663ms step_avg:220.40ms step:1161/6710 train_time:255885ms step_avg:220.40ms step:1162/6710 train_time:256105ms step_avg:220.40ms step:1163/6710 train_time:256328ms step_avg:220.40ms step:1164/6710 train_time:256548ms step_avg:220.40ms step:1165/6710 train_time:256771ms step_avg:220.40ms step:1166/6710 train_time:256994ms step_avg:220.41ms step:1167/6710 train_time:257218ms step_avg:220.41ms step:1168/6710 train_time:257439ms step_avg:220.41ms step:1169/6710 train_time:257659ms step_avg:220.41ms step:1170/6710 train_time:257880ms step_avg:220.41ms step:1171/6710 train_time:258100ms step_avg:220.41ms step:1172/6710 train_time:258322ms step_avg:220.41ms step:1173/6710 train_time:258542ms step_avg:220.41ms step:1174/6710 train_time:258763ms step_avg:220.41ms step:1175/6710 train_time:258986ms step_avg:220.41ms step:1176/6710 train_time:259207ms step_avg:220.41ms step:1177/6710 train_time:259430ms step_avg:220.42ms step:1178/6710 train_time:259653ms step_avg:220.42ms step:1179/6710 train_time:259874ms step_avg:220.42ms step:1180/6710 train_time:260098ms step_avg:220.42ms step:1181/6710 train_time:260320ms step_avg:220.42ms step:1182/6710 train_time:260541ms step_avg:220.42ms step:1183/6710 train_time:260761ms step_avg:220.42ms step:1184/6710 train_time:260983ms step_avg:220.42ms step:1185/6710 train_time:261205ms step_avg:220.43ms step:1186/6710 train_time:261426ms step_avg:220.43ms step:1187/6710 train_time:261645ms step_avg:220.43ms step:1188/6710 train_time:261865ms step_avg:220.43ms step:1189/6710 train_time:262088ms step_avg:220.43ms step:1190/6710 train_time:262310ms step_avg:220.43ms step:1191/6710 train_time:262532ms step_avg:220.43ms step:1192/6710 train_time:262755ms step_avg:220.43ms step:1193/6710 train_time:262977ms step_avg:220.43ms step:1194/6710 train_time:263198ms 
step_avg:220.43ms step:1195/6710 train_time:263418ms step_avg:220.43ms step:1196/6710 train_time:263638ms step_avg:220.43ms step:1197/6710 train_time:263858ms step_avg:220.43ms step:1198/6710 train_time:264080ms step_avg:220.43ms step:1199/6710 train_time:264300ms step_avg:220.43ms step:1200/6710 train_time:264520ms step_avg:220.43ms step:1201/6710 train_time:264742ms step_avg:220.43ms step:1202/6710 train_time:264962ms step_avg:220.43ms step:1203/6710 train_time:265182ms step_avg:220.43ms step:1204/6710 train_time:265403ms step_avg:220.43ms step:1205/6710 train_time:265623ms step_avg:220.43ms step:1206/6710 train_time:265843ms step_avg:220.43ms step:1207/6710 train_time:266064ms step_avg:220.43ms step:1208/6710 train_time:266285ms step_avg:220.43ms step:1209/6710 train_time:266506ms step_avg:220.44ms step:1210/6710 train_time:266728ms step_avg:220.44ms step:1211/6710 train_time:266949ms step_avg:220.44ms step:1212/6710 train_time:267171ms step_avg:220.44ms step:1213/6710 train_time:267394ms step_avg:220.44ms step:1214/6710 train_time:267616ms step_avg:220.44ms step:1215/6710 train_time:267838ms step_avg:220.44ms step:1216/6710 train_time:268058ms step_avg:220.44ms step:1217/6710 train_time:268279ms step_avg:220.44ms step:1218/6710 train_time:268501ms step_avg:220.44ms step:1219/6710 train_time:268723ms step_avg:220.45ms step:1220/6710 train_time:268942ms step_avg:220.44ms step:1221/6710 train_time:269164ms step_avg:220.45ms step:1222/6710 train_time:269385ms step_avg:220.45ms step:1223/6710 train_time:269606ms step_avg:220.45ms step:1224/6710 train_time:269827ms step_avg:220.45ms step:1225/6710 train_time:270049ms step_avg:220.45ms step:1226/6710 train_time:270269ms step_avg:220.45ms step:1227/6710 train_time:270492ms step_avg:220.45ms step:1228/6710 train_time:270714ms step_avg:220.45ms step:1229/6710 train_time:270936ms step_avg:220.45ms step:1230/6710 train_time:271157ms step_avg:220.45ms step:1231/6710 train_time:271378ms step_avg:220.45ms step:1232/6710 
train_time:271599ms step_avg:220.45ms step:1233/6710 train_time:271820ms step_avg:220.45ms step:1234/6710 train_time:272041ms step_avg:220.45ms step:1235/6710 train_time:272262ms step_avg:220.46ms step:1236/6710 train_time:272482ms step_avg:220.46ms step:1237/6710 train_time:272703ms step_avg:220.46ms step:1238/6710 train_time:272924ms step_avg:220.46ms step:1239/6710 train_time:273144ms step_avg:220.46ms step:1240/6710 train_time:273366ms step_avg:220.46ms step:1241/6710 train_time:273587ms step_avg:220.46ms step:1242/6710 train_time:273810ms step_avg:220.46ms step:1243/6710 train_time:274032ms step_avg:220.46ms step:1244/6710 train_time:274254ms step_avg:220.46ms step:1245/6710 train_time:274475ms step_avg:220.46ms step:1246/6710 train_time:274698ms step_avg:220.46ms step:1247/6710 train_time:274919ms step_avg:220.46ms step:1248/6710 train_time:275140ms step_avg:220.46ms step:1249/6710 train_time:275360ms step_avg:220.46ms step:1250/6710 train_time:275581ms step_avg:220.46ms step:1250/6710 val_loss:3.400618 train_time:275754ms step_avg:220.60ms Parameter containing: tensor([1.0000, 1.0000, 0.4203, 1.0000, 0.7892, 1.0000, 0.6074, 1.0000], device='cuda:0', requires_grad=True) 0 [3.9739060401916504, 2.973903179168701] 1 [0.7091032862663269, 2.8970937728881836] 2 [0.9207925796508789, 2.42252254486084] 3 [0.63188236951828, 1.7384213209152222] 4 [0.27083471417427063, 1.4119735956192017] 5 [0.9092891812324524, 2.183462381362915] 6 [0.5891609787940979, 2.095989942550659] 7 [0.8569706678390503, 3.026293992996216] 8 [0.38332822918891907, 1.5588637590408325] 9 [0.5584778189659119, 1.9827752113342285] 10 [0.6628251671791077, 2.0789740085601807] 11 [0.4379427433013916, 2.0591306686401367] 12 [1.1775442361831665, 2.936940908432007] 13 [1.1090525388717651, 2.0906982421875] 14 [0.9512550234794617, 1.8489432334899902] 15 [0.7330122590065002, 1.6997528076171875] 0 [6.929716110229492, 14.598044395446777, 14.292770385742188] 1 [20.254180908203125, 14.696621894836426, 
31.222326278686523] 2 [45.21142578125, 13.475412368774414, 17.01280975341797] 3 [37.48884963989258, 14.120287895202637, 20.2734432220459] 4 [15.631142616271973, 14.161048889160156, 12.181936264038086] 5 [30.126880645751953, 12.300817489624023, 19.963348388671875] 6 [29.446924209594727, 14.216377258300781, 16.094091415405273] 7 [41.222660064697266, 0.0, 29.305938720703125] 8 [23.220840454101562, 16.506065368652344, 26.13033103942871] 9 [42.21305465698242, 13.430880546569824, 20.662940979003906] 10 [54.21799850463867, 10.600054740905762, 17.934839248657227] 11 [38.52985763549805, 17.094709396362305, 10.097570419311523] 12 [64.82605743408203, 10.776372909545898, 13.750439643859863] 13 [85.4646987915039, 12.355538368225098, 18.54092788696289] 14 [91.43362426757812, 14.411285400390625, 24.75998878479004] 15 [76.23210906982422, 41.312416076660156, 56.01831817626953] step:1251/6710 train_time:275802ms step_avg:220.47ms step:1252/6710 train_time:276026ms step_avg:220.47ms step:1253/6710 train_time:276245ms step_avg:220.47ms step:1254/6710 train_time:276466ms step_avg:220.47ms step:1255/6710 train_time:276688ms step_avg:220.47ms step:1256/6710 train_time:276911ms step_avg:220.47ms step:1257/6710 train_time:277132ms step_avg:220.47ms step:1258/6710 train_time:277352ms step_avg:220.47ms step:1259/6710 train_time:277572ms step_avg:220.47ms step:1260/6710 train_time:277794ms step_avg:220.47ms step:1261/6710 train_time:278016ms step_avg:220.47ms step:1262/6710 train_time:278235ms step_avg:220.47ms step:1263/6710 train_time:278456ms step_avg:220.47ms step:1264/6710 train_time:278679ms step_avg:220.47ms step:1265/6710 train_time:278902ms step_avg:220.48ms step:1266/6710 train_time:279125ms step_avg:220.48ms step:1267/6710 train_time:279347ms step_avg:220.48ms step:1268/6710 train_time:279566ms step_avg:220.48ms step:1269/6710 train_time:279788ms step_avg:220.48ms step:1270/6710 train_time:280009ms step_avg:220.48ms step:1271/6710 train_time:280230ms step_avg:220.48ms 
step:1272/6710 train_time:280449ms step_avg:220.48ms step:1273/6710 train_time:280669ms step_avg:220.48ms step:1274/6710 train_time:280891ms step_avg:220.48ms step:1275/6710 train_time:281111ms step_avg:220.48ms step:1276/6710 train_time:281331ms step_avg:220.48ms step:1277/6710 train_time:281550ms step_avg:220.48ms step:1278/6710 train_time:281772ms step_avg:220.48ms step:1279/6710 train_time:281993ms step_avg:220.48ms step:1280/6710 train_time:282215ms step_avg:220.48ms step:1281/6710 train_time:282436ms step_avg:220.48ms step:1282/6710 train_time:282657ms step_avg:220.48ms step:1283/6710 train_time:282879ms step_avg:220.48ms step:1284/6710 train_time:283101ms step_avg:220.48ms step:1285/6710 train_time:283323ms step_avg:220.48ms step:1286/6710 train_time:283544ms step_avg:220.49ms step:1287/6710 train_time:283764ms step_avg:220.49ms step:1288/6710 train_time:283985ms step_avg:220.49ms step:1289/6710 train_time:284207ms step_avg:220.49ms step:1290/6710 train_time:284427ms step_avg:220.49ms step:1291/6710 train_time:284647ms step_avg:220.49ms step:1292/6710 train_time:284867ms step_avg:220.49ms step:1293/6710 train_time:285090ms step_avg:220.49ms step:1294/6710 train_time:285310ms step_avg:220.49ms step:1295/6710 train_time:285532ms step_avg:220.49ms step:1296/6710 train_time:285752ms step_avg:220.49ms step:1297/6710 train_time:285973ms step_avg:220.49ms step:1298/6710 train_time:286195ms step_avg:220.49ms step:1299/6710 train_time:286417ms step_avg:220.49ms step:1300/6710 train_time:286640ms step_avg:220.49ms step:1301/6710 train_time:286861ms step_avg:220.49ms step:1302/6710 train_time:287084ms step_avg:220.49ms step:1303/6710 train_time:287306ms step_avg:220.50ms step:1304/6710 train_time:287528ms step_avg:220.50ms step:1305/6710 train_time:287748ms step_avg:220.50ms step:1306/6710 train_time:287967ms step_avg:220.50ms step:1307/6710 train_time:288190ms step_avg:220.50ms step:1308/6710 train_time:288411ms step_avg:220.50ms step:1309/6710 train_time:288634ms 
step_avg:220.50ms step:1310/6710 train_time:288854ms step_avg:220.50ms step:1311/6710 train_time:289076ms step_avg:220.50ms step:1312/6710 train_time:289298ms step_avg:220.50ms step:1313/6710 train_time:289520ms step_avg:220.50ms step:1314/6710 train_time:289742ms step_avg:220.50ms step:1315/6710 train_time:289962ms step_avg:220.50ms step:1316/6710 train_time:290184ms step_avg:220.50ms step:1317/6710 train_time:290407ms step_avg:220.51ms step:1318/6710 train_time:290629ms step_avg:220.51ms step:1319/6710 train_time:290849ms step_avg:220.51ms step:1320/6710 train_time:291069ms step_avg:220.51ms step:1321/6710 train_time:291290ms step_avg:220.51ms step:1322/6710 train_time:291511ms step_avg:220.51ms step:1323/6710 train_time:291733ms step_avg:220.51ms step:1324/6710 train_time:291954ms step_avg:220.51ms step:1325/6710 train_time:292176ms step_avg:220.51ms step:1326/6710 train_time:292400ms step_avg:220.51ms step:1327/6710 train_time:292624ms step_avg:220.52ms step:1328/6710 train_time:292845ms step_avg:220.52ms step:1329/6710 train_time:293067ms step_avg:220.52ms step:1330/6710 train_time:293287ms step_avg:220.52ms step:1331/6710 train_time:293508ms step_avg:220.52ms step:1332/6710 train_time:293728ms step_avg:220.52ms step:1333/6710 train_time:293948ms step_avg:220.52ms step:1334/6710 train_time:294168ms step_avg:220.52ms step:1335/6710 train_time:294388ms step_avg:220.52ms step:1336/6710 train_time:294609ms step_avg:220.52ms step:1337/6710 train_time:294830ms step_avg:220.52ms step:1338/6710 train_time:295050ms step_avg:220.52ms step:1339/6710 train_time:295270ms step_avg:220.52ms step:1340/6710 train_time:295491ms step_avg:220.52ms step:1341/6710 train_time:295713ms step_avg:220.52ms step:1342/6710 train_time:295934ms step_avg:220.52ms step:1343/6710 train_time:296155ms step_avg:220.52ms step:1344/6710 train_time:296377ms step_avg:220.52ms step:1345/6710 train_time:296599ms step_avg:220.52ms step:1346/6710 train_time:296822ms step_avg:220.52ms step:1347/6710 
train_time:297044ms step_avg:220.52ms step:1348/6710 train_time:297265ms step_avg:220.52ms step:1349/6710 train_time:297487ms step_avg:220.52ms step:1350/6710 train_time:297708ms step_avg:220.52ms step:1351/6710 train_time:297928ms step_avg:220.52ms step:1352/6710 train_time:298149ms step_avg:220.52ms step:1353/6710 train_time:298370ms step_avg:220.52ms step:1354/6710 train_time:298593ms step_avg:220.53ms step:1355/6710 train_time:298815ms step_avg:220.53ms step:1356/6710 train_time:299037ms step_avg:220.53ms step:1357/6710 train_time:299258ms step_avg:220.53ms step:1358/6710 train_time:299481ms step_avg:220.53ms step:1359/6710 train_time:299702ms step_avg:220.53ms step:1360/6710 train_time:299924ms step_avg:220.53ms step:1361/6710 train_time:300145ms step_avg:220.53ms step:1362/6710 train_time:300366ms step_avg:220.53ms step:1363/6710 train_time:300588ms step_avg:220.53ms step:1364/6710 train_time:300809ms step_avg:220.53ms step:1365/6710 train_time:301029ms step_avg:220.53ms step:1366/6710 train_time:301250ms step_avg:220.53ms step:1367/6710 train_time:301470ms step_avg:220.53ms step:1368/6710 train_time:301690ms step_avg:220.53ms step:1369/6710 train_time:301910ms step_avg:220.53ms step:1370/6710 train_time:302132ms step_avg:220.53ms step:1371/6710 train_time:302352ms step_avg:220.53ms step:1372/6710 train_time:302573ms step_avg:220.53ms step:1373/6710 train_time:302794ms step_avg:220.53ms step:1374/6710 train_time:303017ms step_avg:220.54ms step:1375/6710 train_time:303238ms step_avg:220.54ms step:1375/6710 val_loss:3.379539 train_time:303413ms step_avg:220.66ms Parameter containing: tensor([1.0000, 1.0000, 0.4077, 1.0000, 0.8003, 1.0000, 0.5998, 1.0000], device='cuda:0', requires_grad=True) 0 [4.269767761230469, 3.2697651386260986] 1 [0.7153313159942627, 3.143454074859619] 2 [0.918975830078125, 2.6102232933044434] 3 [0.6324489116668701, 1.924267292022705] 4 [0.26129183173179626, 1.5245970487594604] 5 [0.9302480816841125, 2.3998842239379883] 6 
[0.5827438831329346, 2.258862018585205] 7 [0.8369877934455872, 3.33524751663208] 8 [0.40255382657051086, 1.6283564567565918] 9 [0.547019362449646, 2.100329875946045] 10 [0.6625146865844727, 2.203977346420288] 11 [0.42013487219810486, 2.172938585281372] 12 [1.1812046766281128, 3.2955822944641113] 13 [1.1105233430862427, 2.310349464416504] 14 [0.9550685882568359, 1.9649213552474976] 15 [0.7346623539924622, 1.7820073366165161] 0 [7.520759582519531, 15.929862022399902, 15.599212646484375] 1 [22.20950698852539, 15.842622756958008, 35.19618606567383] 2 [49.91110610961914, 14.664288520812988, 18.92940902709961] 3 [41.337833404541016, 15.886796951293945, 22.170387268066406] 4 [16.62940788269043, 15.752031326293945, 13.00510025024414] 5 [33.266761779785156, 13.503043174743652, 21.83572769165039] 6 [31.93194007873535, 15.629902839660645, 17.855066299438477] 7 [44.0190544128418, 0.0, 31.855804443359375] 8 [26.095211029052734, 18.120941162109375, 28.7309627532959] 9 [45.40310287475586, 14.795255661010742, 22.514341354370117] 10 [58.76200485229492, 11.717400550842285, 19.531211853027344] 11 [40.02079391479492, 18.938417434692383, 10.684234619140625] 12 [68.89804077148438, 11.828568458557129, 14.774785995483398] 13 [91.3319320678711, 13.198575019836426, 19.795650482177734] 14 [98.02123260498047, 15.361611366271973, 26.708507537841797] 15 [81.96690368652344, 46.39628982543945, 62.34980010986328] step:1376/6710 train_time:303461ms step_avg:220.54ms step:1377/6710 train_time:303678ms step_avg:220.54ms step:1378/6710 train_time:303903ms step_avg:220.54ms step:1379/6710 train_time:304123ms step_avg:220.54ms step:1380/6710 train_time:304343ms step_avg:220.54ms step:1381/6710 train_time:304568ms step_avg:220.54ms step:1382/6710 train_time:304789ms step_avg:220.54ms step:1383/6710 train_time:305012ms step_avg:220.54ms step:1384/6710 train_time:305233ms step_avg:220.54ms step:1385/6710 train_time:305454ms step_avg:220.54ms step:1386/6710 train_time:305675ms step_avg:220.54ms 
step:1387/6710 train_time:305898ms step_avg:220.55ms step:1388/6710 train_time:306119ms step_avg:220.55ms step:1389/6710 train_time:306341ms step_avg:220.55ms step:1390/6710 train_time:306562ms step_avg:220.55ms step:1391/6710 train_time:306784ms step_avg:220.55ms step:1392/6710 train_time:307007ms step_avg:220.55ms step:1393/6710 train_time:307229ms step_avg:220.55ms step:1394/6710 train_time:307451ms step_avg:220.55ms step:1395/6710 train_time:307672ms step_avg:220.55ms step:1396/6710 train_time:307893ms step_avg:220.55ms step:1397/6710 train_time:308114ms step_avg:220.55ms step:1398/6710 train_time:308335ms step_avg:220.55ms step:1399/6710 train_time:308555ms step_avg:220.55ms step:1400/6710 train_time:308776ms step_avg:220.55ms step:1401/6710 train_time:308996ms step_avg:220.55ms step:1402/6710 train_time:309217ms step_avg:220.55ms step:1403/6710 train_time:309437ms step_avg:220.55ms step:1404/6710 train_time:309658ms step_avg:220.55ms step:1405/6710 train_time:309879ms step_avg:220.55ms step:1406/6710 train_time:310099ms step_avg:220.55ms step:1407/6710 train_time:310321ms step_avg:220.56ms step:1408/6710 train_time:310542ms step_avg:220.56ms step:1409/6710 train_time:310763ms step_avg:220.56ms step:1410/6710 train_time:310985ms step_avg:220.56ms step:1411/6710 train_time:311207ms step_avg:220.56ms step:1412/6710 train_time:311429ms step_avg:220.56ms step:1413/6710 train_time:311650ms step_avg:220.56ms step:1414/6710 train_time:311871ms step_avg:220.56ms step:1415/6710 train_time:312092ms step_avg:220.56ms step:1416/6710 train_time:312314ms step_avg:220.56ms step:1417/6710 train_time:312535ms step_avg:220.56ms step:1418/6710 train_time:312757ms step_avg:220.56ms step:1419/6710 train_time:312977ms step_avg:220.56ms step:1420/6710 train_time:313197ms step_avg:220.56ms step:1421/6710 train_time:313418ms step_avg:220.56ms step:1422/6710 train_time:313639ms step_avg:220.56ms step:1423/6710 train_time:313859ms step_avg:220.56ms step:1424/6710 train_time:314080ms 
step_avg:220.56ms step:1425/6710 train_time:314301ms step_avg:220.56ms step:1426/6710 train_time:314523ms step_avg:220.56ms step:1427/6710 train_time:314745ms step_avg:220.56ms step:1428/6710 train_time:314966ms step_avg:220.56ms step:1429/6710 train_time:315187ms step_avg:220.56ms step:1430/6710 train_time:315410ms step_avg:220.57ms step:1431/6710 train_time:315633ms step_avg:220.57ms step:1432/6710 train_time:315854ms step_avg:220.57ms step:1433/6710 train_time:316074ms step_avg:220.57ms step:1434/6710 train_time:316295ms step_avg:220.57ms step:1435/6710 train_time:316517ms step_avg:220.57ms step:1436/6710 train_time:316738ms step_avg:220.57ms step:1437/6710 train_time:316958ms step_avg:220.57ms step:1438/6710 train_time:317178ms step_avg:220.57ms step:1439/6710 train_time:317400ms step_avg:220.57ms step:1440/6710 train_time:317621ms step_avg:220.57ms step:1441/6710 train_time:317843ms step_avg:220.57ms step:1442/6710 train_time:318065ms step_avg:220.57ms step:1443/6710 train_time:318287ms step_avg:220.57ms step:1444/6710 train_time:318511ms step_avg:220.58ms step:1445/6710 train_time:318732ms step_avg:220.58ms step:1446/6710 train_time:318954ms step_avg:220.58ms step:1447/6710 train_time:319173ms step_avg:220.58ms step:1448/6710 train_time:319394ms step_avg:220.58ms step:1449/6710 train_time:319616ms step_avg:220.58ms step:1450/6710 train_time:319838ms step_avg:220.58ms step:1451/6710 train_time:320058ms step_avg:220.58ms step:1452/6710 train_time:320278ms step_avg:220.58ms step:1453/6710 train_time:320499ms step_avg:220.58ms step:1454/6710 train_time:320721ms step_avg:220.58ms step:1455/6710 train_time:320942ms step_avg:220.58ms step:1456/6710 train_time:321163ms step_avg:220.58ms step:1457/6710 train_time:321384ms step_avg:220.58ms step:1458/6710 train_time:321606ms step_avg:220.58ms step:1459/6710 train_time:321830ms step_avg:220.58ms step:1460/6710 train_time:322052ms step_avg:220.58ms step:1461/6710 train_time:322272ms step_avg:220.58ms step:1462/6710 
train_time:322493ms step_avg:220.58ms step:1463/6710 train_time:322715ms step_avg:220.58ms step:1464/6710 train_time:322936ms step_avg:220.58ms step:1465/6710 train_time:323157ms step_avg:220.58ms step:1466/6710 train_time:323377ms step_avg:220.58ms step:1467/6710 train_time:323599ms step_avg:220.59ms step:1468/6710 train_time:323820ms step_avg:220.59ms step:1469/6710 train_time:324042ms step_avg:220.59ms step:1470/6710 train_time:324262ms step_avg:220.59ms step:1471/6710 train_time:324484ms step_avg:220.59ms step:1472/6710 train_time:324707ms step_avg:220.59ms step:1473/6710 train_time:324928ms step_avg:220.59ms step:1474/6710 train_time:325150ms step_avg:220.59ms step:1475/6710 train_time:325372ms step_avg:220.59ms step:1476/6710 train_time:325595ms step_avg:220.59ms step:1477/6710 train_time:325815ms step_avg:220.59ms step:1478/6710 train_time:326035ms step_avg:220.59ms step:1479/6710 train_time:326256ms step_avg:220.59ms step:1480/6710 train_time:326477ms step_avg:220.59ms step:1481/6710 train_time:326698ms step_avg:220.59ms step:1482/6710 train_time:326919ms step_avg:220.59ms step:1483/6710 train_time:327140ms step_avg:220.59ms step:1484/6710 train_time:327360ms step_avg:220.59ms step:1485/6710 train_time:327582ms step_avg:220.59ms step:1486/6710 train_time:327804ms step_avg:220.60ms step:1487/6710 train_time:328028ms step_avg:220.60ms step:1488/6710 train_time:328250ms step_avg:220.60ms step:1489/6710 train_time:328471ms step_avg:220.60ms step:1490/6710 train_time:328693ms step_avg:220.60ms step:1491/6710 train_time:328915ms step_avg:220.60ms step:1492/6710 train_time:329136ms step_avg:220.60ms step:1493/6710 train_time:329357ms step_avg:220.60ms step:1494/6710 train_time:329582ms step_avg:220.60ms step:1495/6710 train_time:329808ms step_avg:220.61ms step:1496/6710 train_time:330037ms step_avg:220.61ms step:1497/6710 train_time:330262ms step_avg:220.62ms step:1498/6710 train_time:330488ms step_avg:220.62ms step:1499/6710 train_time:330715ms step_avg:220.62ms 
step:1500/6710 train_time:330941ms step_avg:220.63ms step:1500/6710 val_loss:3.332108 train_time:331121ms step_avg:220.75ms Parameter containing: tensor([1.0000, 1.0000, 0.4204, 1.0000, 0.7881, 1.0000, 0.5796, 1.0000], device='cuda:0', requires_grad=True) 0 [4.501767635345459, 3.5017635822296143] 1 [0.7008436918258667, 3.3515231609344482] 2 [0.9256706237792969, 2.7744476795196533] 3 [0.6397372484207153, 2.0723352432250977] 4 [0.2836114168167114, 1.5880663394927979] 5 [0.8847246766090393, 2.5616397857666016] 6 [0.567281186580658, 2.368133544921875] 7 [0.8679960370063782, 3.551424980163574] 8 [0.3880561888217926, 1.6025687456130981] 9 [0.5502011179924011, 2.154813289642334] 10 [0.6686618328094482, 2.2638838291168213] 11 [0.42019546031951904, 2.2295796871185303] 12 [1.1669765710830688, 3.57502818107605] 13 [1.1001482009887695, 2.463340997695923] 14 [0.9576259851455688, 1.992436170578003] 15 [0.7454551458358765, 1.7994105815887451] 0 [7.988635063171387, 17.215591430664062, 16.44760513305664] 1 [23.21832847595215, 16.93397331237793, 41.0661735534668] 2 [55.70256805419922, 14.990413665771484, 19.71050262451172] 3 [45.4450798034668, 17.21469497680664, 22.936189651489258] 4 [19.310029983520508, 17.28574562072754, 13.659333229064941] 5 [35.31432342529297, 14.298598289489746, 23.057907104492188] 6 [32.89436340332031, 16.426708221435547, 18.659954071044922] 7 [47.24552536010742, 0.0, 33.0806884765625] 8 [26.66727638244629, 18.947921752929688, 29.73819351196289] 9 [46.606956481933594, 15.810996055603027, 23.837299346923828] 10 [62.55326843261719, 12.511007308959961, 20.912782669067383] 11 [43.07362747192383, 20.73332977294922, 11.119253158569336] 12 [73.5809555053711, 12.62125015258789, 15.24975872039795] 13 [96.47267150878906, 13.506917953491211, 20.636171340942383] 14 [103.58844757080078, 15.983616828918457, 29.045167922973633] 15 [87.89362335205078, 51.12504959106445, 68.03008270263672] step:1501/6710 train_time:331170ms step_avg:220.63ms step:1502/6710 train_time:331392ms 
step_avg:220.63ms step:1503/6710 train_time:331622ms step_avg:220.64ms step:1504/6710 train_time:331847ms step_avg:220.64ms step:1505/6710 train_time:332075ms step_avg:220.65ms step:1506/6710 train_time:332302ms step_avg:220.65ms step:1507/6710 train_time:332530ms step_avg:220.66ms step:1508/6710 train_time:332758ms step_avg:220.66ms step:1509/6710 train_time:332984ms step_avg:220.67ms step:1510/6710 train_time:333210ms step_avg:220.67ms step:1511/6710 train_time:333437ms step_avg:220.67ms step:1512/6710 train_time:333663ms step_avg:220.68ms step:1513/6710 train_time:333890ms step_avg:220.68ms step:1514/6710 train_time:334117ms step_avg:220.68ms step:1515/6710 train_time:334341ms step_avg:220.69ms step:1516/6710 train_time:334567ms step_avg:220.69ms step:1517/6710 train_time:334796ms step_avg:220.70ms step:1518/6710 train_time:335021ms step_avg:220.70ms step:1519/6710 train_time:335248ms step_avg:220.70ms step:1520/6710 train_time:335475ms step_avg:220.71ms step:1521/6710 train_time:335703ms step_avg:220.71ms step:1522/6710 train_time:335930ms step_avg:220.72ms step:1523/6710 train_time:336158ms step_avg:220.72ms step:1524/6710 train_time:336383ms step_avg:220.72ms step:1525/6710 train_time:336610ms step_avg:220.73ms step:1526/6710 train_time:336836ms step_avg:220.73ms step:1527/6710 train_time:337062ms step_avg:220.73ms step:1528/6710 train_time:337288ms step_avg:220.74ms step:1529/6710 train_time:337516ms step_avg:220.74ms step:1530/6710 train_time:337742ms step_avg:220.75ms step:1531/6710 train_time:337967ms step_avg:220.75ms step:1532/6710 train_time:338194ms step_avg:220.75ms step:1533/6710 train_time:338419ms step_avg:220.76ms step:1534/6710 train_time:338645ms step_avg:220.76ms step:1535/6710 train_time:338872ms step_avg:220.76ms step:1536/6710 train_time:339099ms step_avg:220.77ms step:1537/6710 train_time:339323ms step_avg:220.77ms step:1538/6710 train_time:339549ms step_avg:220.77ms step:1539/6710 train_time:339776ms step_avg:220.78ms step:1540/6710 
train_time:340002ms step_avg:220.78ms step:1541/6710 train_time:340228ms step_avg:220.78ms step:1542/6710 train_time:340455ms step_avg:220.79ms step:1543/6710 train_time:340680ms step_avg:220.79ms step:1544/6710 train_time:340906ms step_avg:220.79ms step:1545/6710 train_time:341134ms step_avg:220.80ms step:1546/6710 train_time:341360ms step_avg:220.80ms step:1547/6710 train_time:341587ms step_avg:220.81ms step:1548/6710 train_time:341813ms step_avg:220.81ms step:1549/6710 train_time:342038ms step_avg:220.81ms step:1550/6710 train_time:342265ms step_avg:220.82ms step:1551/6710 train_time:342492ms step_avg:220.82ms step:1552/6710 train_time:342718ms step_avg:220.82ms step:1553/6710 train_time:342945ms step_avg:220.83ms step:1554/6710 train_time:343170ms step_avg:220.83ms step:1555/6710 train_time:343398ms step_avg:220.83ms step:1556/6710 train_time:343624ms step_avg:220.84ms step:1557/6710 train_time:343850ms step_avg:220.84ms step:1558/6710 train_time:344078ms step_avg:220.85ms step:1559/6710 train_time:344304ms step_avg:220.85ms step:1560/6710 train_time:344531ms step_avg:220.85ms step:1561/6710 train_time:344757ms step_avg:220.86ms step:1562/6710 train_time:344983ms step_avg:220.86ms step:1563/6710 train_time:345210ms step_avg:220.86ms step:1564/6710 train_time:345436ms step_avg:220.87ms step:1565/6710 train_time:345663ms step_avg:220.87ms step:1566/6710 train_time:345890ms step_avg:220.87ms step:1567/6710 train_time:346117ms step_avg:220.88ms step:1568/6710 train_time:346342ms step_avg:220.88ms step:1569/6710 train_time:346568ms step_avg:220.88ms step:1570/6710 train_time:346796ms step_avg:220.89ms step:1571/6710 train_time:347022ms step_avg:220.89ms step:1572/6710 train_time:347249ms step_avg:220.90ms step:1573/6710 train_time:347477ms step_avg:220.90ms step:1574/6710 train_time:347701ms step_avg:220.90ms step:1575/6710 train_time:347928ms step_avg:220.91ms step:1576/6710 train_time:348154ms step_avg:220.91ms step:1577/6710 train_time:348380ms step_avg:220.91ms 
step:1578/6710 train_time:348606ms step_avg:220.92ms step:1579/6710 train_time:348833ms step_avg:220.92ms step:1580/6710 train_time:349060ms step_avg:220.92ms step:1581/6710 train_time:349285ms step_avg:220.93ms step:1582/6710 train_time:349512ms step_avg:220.93ms step:1583/6710 train_time:349739ms step_avg:220.93ms step:1584/6710 train_time:349964ms step_avg:220.94ms step:1585/6710 train_time:350190ms step_avg:220.94ms step:1586/6710 train_time:350415ms step_avg:220.94ms step:1587/6710 train_time:350640ms step_avg:220.95ms step:1588/6710 train_time:350866ms step_avg:220.95ms step:1589/6710 train_time:351094ms step_avg:220.95ms step:1590/6710 train_time:351319ms step_avg:220.96ms step:1591/6710 train_time:351545ms step_avg:220.96ms step:1592/6710 train_time:351772ms step_avg:220.96ms step:1593/6710 train_time:351997ms step_avg:220.97ms step:1594/6710 train_time:352223ms step_avg:220.97ms step:1595/6710 train_time:352450ms step_avg:220.97ms step:1596/6710 train_time:352676ms step_avg:220.97ms step:1597/6710 train_time:352903ms step_avg:220.98ms step:1598/6710 train_time:353129ms step_avg:220.98ms step:1599/6710 train_time:353356ms step_avg:220.99ms step:1600/6710 train_time:353580ms step_avg:220.99ms step:1601/6710 train_time:353806ms step_avg:220.99ms step:1602/6710 train_time:354034ms step_avg:221.00ms step:1603/6710 train_time:354260ms step_avg:221.00ms step:1604/6710 train_time:354486ms step_avg:221.00ms step:1605/6710 train_time:354712ms step_avg:221.00ms step:1606/6710 train_time:354938ms step_avg:221.01ms step:1607/6710 train_time:355164ms step_avg:221.01ms step:1608/6710 train_time:355391ms step_avg:221.01ms step:1609/6710 train_time:355618ms step_avg:221.02ms step:1610/6710 train_time:355845ms step_avg:221.02ms step:1611/6710 train_time:356072ms step_avg:221.03ms step:1612/6710 train_time:356298ms step_avg:221.03ms step:1613/6710 train_time:356523ms step_avg:221.03ms step:1614/6710 train_time:356747ms step_avg:221.03ms step:1615/6710 train_time:356972ms 
step_avg:221.04ms step:1616/6710 train_time:357199ms step_avg:221.04ms step:1617/6710 train_time:357425ms step_avg:221.04ms step:1618/6710 train_time:357651ms step_avg:221.04ms step:1619/6710 train_time:357878ms step_avg:221.05ms step:1620/6710 train_time:358105ms step_avg:221.05ms step:1621/6710 train_time:358331ms step_avg:221.06ms step:1622/6710 train_time:358558ms step_avg:221.06ms step:1623/6710 train_time:358783ms step_avg:221.06ms step:1624/6710 train_time:359011ms step_avg:221.07ms step:1625/6710 train_time:359237ms step_avg:221.07ms step:1625/6710 val_loss:3.310216 train_time:359414ms step_avg:221.18ms Parameter containing: tensor([1.0000, 1.0000, 0.4147, 1.0000, 0.7285, 1.0000, 0.5895, 1.0000], device='cuda:0', requires_grad=True) 0 [4.760634899139404, 3.7606334686279297] 1 [0.6473170518875122, 3.6527256965637207] 2 [0.9013830423355103, 3.020909309387207] 3 [0.6469859480857849, 2.2695863246917725] 4 [0.295980304479599, 1.7321662902832031] 5 [0.845492959022522, 2.7279856204986572] 6 [0.5384994745254517, 2.5046544075012207] 7 [0.8620471358299255, 3.8055038452148438] 8 [0.3811820447444916, 1.682830572128296] 9 [0.5416708588600159, 2.2835233211517334] 10 [0.6623947620391846, 2.3964216709136963] 11 [0.4458443224430084, 2.361795663833618] 12 [1.1090952157974243, 3.831545114517212] 13 [1.0965394973754883, 2.562105894088745] 14 [0.9672178626060486, 1.9908397197723389] 15 [0.7613324522972107, 1.751586675643921] 0 [8.504661560058594, 18.253738403320312, 17.7988224029541] 1 [23.227294921875, 18.169654846191406, 42.246437072753906] 2 [55.711334228515625, 16.40200424194336, 21.36931037902832] 3 [47.14982986450195, 18.879053115844727, 24.599285125732422] 4 [21.155210494995117, 18.2236328125, 16.033981323242188] 5 [37.04435348510742, 16.110944747924805, 25.447805404663086] 6 [33.70867156982422, 18.276138305664062, 19.808277130126953] 7 [49.373565673828125, 0.0, 35.842628479003906] 8 [27.836633682250977, 20.92072296142578, 31.565549850463867] 9 [48.80202102661133, 
17.48360252380371, 25.581892013549805] 10 [64.79448699951172, 14.365492820739746, 22.65503692626953] 11 [47.44607162475586, 21.956310272216797, 12.611809730529785] 12 [76.71031188964844, 14.402392387390137, 16.236698150634766] 13 [101.13080596923828, 15.444390296936035, 21.85451889038086] 14 [110.06299591064453, 18.23345375061035, 30.760543823242188] 15 [95.64259338378906, 55.74564743041992, 75.10340881347656] step:1626/6710 train_time:359463ms step_avg:221.07ms step:1627/6710 train_time:359687ms step_avg:221.07ms step:1628/6710 train_time:359921ms step_avg:221.08ms step:1629/6710 train_time:360147ms step_avg:221.08ms step:1630/6710 train_time:360372ms step_avg:221.09ms step:1631/6710 train_time:360599ms step_avg:221.09ms step:1632/6710 train_time:360826ms step_avg:221.09ms step:1633/6710 train_time:361055ms step_avg:221.10ms step:1634/6710 train_time:361279ms step_avg:221.10ms step:1635/6710 train_time:361504ms step_avg:221.10ms step:1636/6710 train_time:361731ms step_avg:221.11ms step:1637/6710 train_time:361959ms step_avg:221.11ms step:1638/6710 train_time:362186ms step_avg:221.11ms step:1639/6710 train_time:362413ms step_avg:221.12ms step:1640/6710 train_time:362638ms step_avg:221.12ms step:1641/6710 train_time:362864ms step_avg:221.12ms step:1642/6710 train_time:363091ms step_avg:221.13ms step:1643/6710 train_time:363316ms step_avg:221.13ms step:1644/6710 train_time:363541ms step_avg:221.13ms step:1645/6710 train_time:363768ms step_avg:221.14ms step:1646/6710 train_time:363995ms step_avg:221.14ms step:1647/6710 train_time:364221ms step_avg:221.14ms step:1648/6710 train_time:364446ms step_avg:221.14ms step:1649/6710 train_time:364672ms step_avg:221.15ms step:1650/6710 train_time:364899ms step_avg:221.15ms step:1651/6710 train_time:365127ms step_avg:221.16ms step:1652/6710 train_time:365354ms step_avg:221.16ms step:1653/6710 train_time:365578ms step_avg:221.16ms step:1654/6710 train_time:365804ms step_avg:221.16ms step:1655/6710 train_time:366033ms 
step_avg:221.17ms step:1656/6710 train_time:366259ms step_avg:221.17ms step:1657/6710 train_time:366484ms step_avg:221.17ms step:1658/6710 train_time:366711ms step_avg:221.18ms step:1659/6710 train_time:366938ms step_avg:221.18ms step:1660/6710 train_time:367164ms step_avg:221.18ms step:1661/6710 train_time:367391ms step_avg:221.19ms step:1662/6710 train_time:367617ms step_avg:221.19ms step:1663/6710 train_time:367842ms step_avg:221.19ms step:1664/6710 train_time:368070ms step_avg:221.20ms step:1665/6710 train_time:368297ms step_avg:221.20ms step:1666/6710 train_time:368523ms step_avg:221.20ms step:1667/6710 train_time:368749ms step_avg:221.21ms step:1668/6710 train_time:368977ms step_avg:221.21ms step:1669/6710 train_time:369202ms step_avg:221.21ms step:1670/6710 train_time:369429ms step_avg:221.22ms step:1671/6710 train_time:369657ms step_avg:221.22ms step:1672/6710 train_time:369884ms step_avg:221.22ms step:1673/6710 train_time:370111ms step_avg:221.23ms step:1674/6710 train_time:370337ms step_avg:221.23ms step:1675/6710 train_time:370563ms step_avg:221.23ms step:1676/6710 train_time:370789ms step_avg:221.23ms step:1677/6710 train_time:371016ms step_avg:221.24ms step:1678/6710 train_time:371240ms step_avg:221.24ms step:1679/6710 train_time:371467ms step_avg:221.24ms step:1680/6710 train_time:371694ms step_avg:221.25ms step:1681/6710 train_time:371921ms step_avg:221.25ms step:1682/6710 train_time:372149ms step_avg:221.25ms step:1683/6710 train_time:372374ms step_avg:221.26ms step:1684/6710 train_time:372599ms step_avg:221.26ms step:1685/6710 train_time:372825ms step_avg:221.26ms step:1686/6710 train_time:373053ms step_avg:221.27ms step:1687/6710 train_time:373278ms step_avg:221.27ms step:1688/6710 train_time:373504ms step_avg:221.27ms step:1689/6710 train_time:373730ms step_avg:221.27ms step:1690/6710 train_time:373957ms step_avg:221.28ms step:1691/6710 train_time:374183ms step_avg:221.28ms step:1692/6710 train_time:374410ms step_avg:221.28ms step:1693/6710 
train_time:374637ms step_avg:221.29ms step:1694/6710 train_time:374862ms step_avg:221.29ms step:1695/6710 train_time:375088ms step_avg:221.29ms step:1696/6710 train_time:375314ms step_avg:221.29ms step:1697/6710 train_time:375538ms step_avg:221.30ms step:1698/6710 train_time:375764ms step_avg:221.30ms step:1699/6710 train_time:375992ms step_avg:221.30ms step:1700/6710 train_time:376218ms step_avg:221.30ms step:1701/6710 train_time:376444ms step_avg:221.31ms step:1702/6710 train_time:376670ms step_avg:221.31ms step:1703/6710 train_time:376899ms step_avg:221.31ms step:1704/6710 train_time:377125ms step_avg:221.32ms step:1705/6710 train_time:377352ms step_avg:221.32ms step:1706/6710 train_time:377577ms step_avg:221.32ms step:1707/6710 train_time:377804ms step_avg:221.33ms step:1708/6710 train_time:378030ms step_avg:221.33ms step:1709/6710 train_time:378258ms step_avg:221.33ms step:1710/6710 train_time:378483ms step_avg:221.34ms step:1711/6710 train_time:378710ms step_avg:221.34ms step:1712/6710 train_time:378937ms step_avg:221.34ms step:1713/6710 train_time:379163ms step_avg:221.34ms step:1714/6710 train_time:379389ms step_avg:221.35ms step:1715/6710 train_time:379614ms step_avg:221.35ms step:1716/6710 train_time:379841ms step_avg:221.35ms step:1717/6710 train_time:380068ms step_avg:221.36ms step:1718/6710 train_time:380294ms step_avg:221.36ms step:1719/6710 train_time:380518ms step_avg:221.36ms step:1720/6710 train_time:380744ms step_avg:221.36ms step:1721/6710 train_time:380970ms step_avg:221.37ms step:1722/6710 train_time:381196ms step_avg:221.37ms step:1723/6710 train_time:381421ms step_avg:221.37ms step:1724/6710 train_time:381647ms step_avg:221.37ms step:1725/6710 train_time:381873ms step_avg:221.38ms step:1726/6710 train_time:382101ms step_avg:221.38ms step:1727/6710 train_time:382327ms step_avg:221.38ms step:1728/6710 train_time:382554ms step_avg:221.39ms step:1729/6710 train_time:382780ms step_avg:221.39ms step:1730/6710 train_time:383007ms step_avg:221.39ms 
step:1731/6710 train_time:383235ms step_avg:221.40ms step:1732/6710 train_time:383461ms step_avg:221.40ms step:1733/6710 train_time:383686ms step_avg:221.40ms step:1734/6710 train_time:383913ms step_avg:221.40ms step:1735/6710 train_time:384140ms step_avg:221.41ms step:1736/6710 train_time:384365ms step_avg:221.41ms step:1737/6710 train_time:384593ms step_avg:221.41ms step:1738/6710 train_time:384818ms step_avg:221.41ms step:1739/6710 train_time:385044ms step_avg:221.42ms step:1740/6710 train_time:385270ms step_avg:221.42ms step:1741/6710 train_time:385496ms step_avg:221.42ms step:1742/6710 train_time:385723ms step_avg:221.43ms step:1743/6710 train_time:385949ms step_avg:221.43ms step:1744/6710 train_time:386175ms step_avg:221.43ms step:1745/6710 train_time:386398ms step_avg:221.43ms step:1746/6710 train_time:386626ms step_avg:221.44ms step:1747/6710 train_time:386852ms step_avg:221.44ms step:1748/6710 train_time:387079ms step_avg:221.44ms step:1749/6710 train_time:387306ms step_avg:221.44ms step:1750/6710 train_time:387533ms step_avg:221.45ms step:1750/6710 val_loss:3.291387 train_time:387710ms step_avg:221.55ms Parameter containing: tensor([1.0000, 1.0000, 0.4116, 1.0000, 0.6974, 1.0000, 0.5815, 1.0000], device='cuda:0', requires_grad=True) 0 [5.003294467926025, 4.003292560577393] 1 [0.6328554749488831, 3.944999933242798] 2 [0.890843391418457, 3.2421224117279053] 3 [0.6579564809799194, 2.444551467895508] 4 [0.30039364099502563, 1.8365422487258911] 5 [0.8362153172492981, 2.885352373123169] 6 [0.5322458744049072, 2.624174118041992] 7 [0.8602120280265808, 4.075568675994873] 8 [0.389273077249527, 1.7305052280426025] 9 [0.5349991917610168, 2.3538739681243896] 10 [0.662344217300415, 2.4915080070495605] 11 [0.4479343593120575, 2.447035551071167] 12 [1.084272027015686, 4.084342002868652] 13 [1.0942808389663696, 2.7041828632354736] 14 [0.9708521366119385, 2.043639659881592] 15 [0.7702471017837524, 1.7628469467163086] 0 [8.990888595581055, 19.42599105834961, 
19.30567169189453] 1 [24.299806594848633, 19.300989151000977, 46.843544006347656] 2 [59.61945724487305, 17.33713722229004, 22.748619079589844] 3 [51.022945404052734, 20.112672805786133, 26.424461364746094] 4 [23.017833709716797, 19.250030517578125, 17.21893882751465] 5 [39.16239929199219, 17.533361434936523, 27.022756576538086] 6 [35.342124938964844, 19.766685485839844, 20.6024112701416] 7 [51.83122253417969, 0.0, 37.49116516113281] 8 [29.707582473754883, 22.335784912109375, 33.566558837890625] 9 [50.83638000488281, 18.9527587890625, 27.23914909362793] 10 [67.57366180419922, 15.876362800598145, 24.191661834716797] 11 [50.16286087036133, 23.26494598388672, 13.682120323181152] 12 [79.62704467773438, 15.72052001953125, 17.321548461914062] 13 [105.62239074707031, 16.740581512451172, 23.534034729003906] 14 [116.0408935546875, 19.754932403564453, 34.0235710144043] 15 [102.89373016357422, 59.748260498046875, 85.81492614746094] step:1751/6710 train_time:387758ms step_avg:221.45ms step:1752/6710 train_time:387999ms step_avg:221.46ms step:1753/6710 train_time:388221ms step_avg:221.46ms step:1754/6710 train_time:388444ms step_avg:221.46ms step:1755/6710 train_time:388669ms step_avg:221.46ms step:1756/6710 train_time:388899ms step_avg:221.47ms step:1757/6710 train_time:389126ms step_avg:221.47ms step:1758/6710 train_time:389350ms step_avg:221.47ms step:1759/6710 train_time:389575ms step_avg:221.48ms step:1760/6710 train_time:389801ms step_avg:221.48ms step:1761/6710 train_time:390029ms step_avg:221.48ms step:1762/6710 train_time:390255ms step_avg:221.48ms step:1763/6710 train_time:390480ms step_avg:221.49ms step:1764/6710 train_time:390705ms step_avg:221.49ms step:1765/6710 train_time:390935ms step_avg:221.49ms step:1766/6710 train_time:391161ms step_avg:221.50ms step:1767/6710 train_time:391386ms step_avg:221.50ms step:1768/6710 train_time:391610ms step_avg:221.50ms step:1769/6710 train_time:391836ms step_avg:221.50ms step:1770/6710 train_time:392062ms step_avg:221.50ms 
step:1771/6710 train_time:392287ms step_avg:221.51ms step:1772/6710 train_time:392512ms step_avg:221.51ms step:1773/6710 train_time:392738ms step_avg:221.51ms step:1774/6710 train_time:392965ms step_avg:221.51ms step:1775/6710 train_time:393192ms step_avg:221.52ms step:1776/6710 train_time:393418ms step_avg:221.52ms step:1777/6710 train_time:393643ms step_avg:221.52ms step:1778/6710 train_time:393869ms step_avg:221.52ms step:1779/6710 train_time:394097ms step_avg:221.53ms step:1780/6710 train_time:394322ms step_avg:221.53ms step:1781/6710 train_time:394547ms step_avg:221.53ms step:1782/6710 train_time:394772ms step_avg:221.53ms step:1783/6710 train_time:394999ms step_avg:221.54ms step:1784/6710 train_time:395227ms step_avg:221.54ms step:1785/6710 train_time:395452ms step_avg:221.54ms step:1786/6710 train_time:395677ms step_avg:221.54ms step:1787/6710 train_time:395904ms step_avg:221.55ms step:1788/6710 train_time:396130ms step_avg:221.55ms step:1789/6710 train_time:396357ms step_avg:221.55ms step:1790/6710 train_time:396582ms step_avg:221.55ms step:1791/6710 train_time:396807ms step_avg:221.56ms step:1792/6710 train_time:397034ms step_avg:221.56ms step:1793/6710 train_time:397260ms step_avg:221.56ms step:1794/6710 train_time:397486ms step_avg:221.56ms step:1795/6710 train_time:397712ms step_avg:221.57ms step:1796/6710 train_time:397939ms step_avg:221.57ms step:1797/6710 train_time:398165ms step_avg:221.57ms step:1798/6710 train_time:398392ms step_avg:221.57ms step:1799/6710 train_time:398617ms step_avg:221.58ms step:1800/6710 train_time:398844ms step_avg:221.58ms step:1801/6710 train_time:399070ms step_avg:221.58ms step:1802/6710 train_time:399298ms step_avg:221.59ms step:1803/6710 train_time:399523ms step_avg:221.59ms step:1804/6710 train_time:399749ms step_avg:221.59ms step:1805/6710 train_time:399977ms step_avg:221.59ms step:1806/6710 train_time:400203ms step_avg:221.60ms step:1807/6710 train_time:400429ms step_avg:221.60ms step:1808/6710 train_time:400655ms 
step_avg:221.60ms step:1809/6710 train_time:400882ms step_avg:221.60ms step:1810/6710 train_time:401107ms step_avg:221.61ms step:1811/6710 train_time:401333ms step_avg:221.61ms step:1812/6710 train_time:401559ms step_avg:221.61ms step:1813/6710 train_time:401785ms step_avg:221.61ms step:1814/6710 train_time:402011ms step_avg:221.62ms step:1815/6710 train_time:402238ms step_avg:221.62ms step:1816/6710 train_time:402463ms step_avg:221.62ms step:1817/6710 train_time:402689ms step_avg:221.62ms step:1818/6710 train_time:402915ms step_avg:221.63ms step:1819/6710 train_time:403141ms step_avg:221.63ms step:1820/6710 train_time:403368ms step_avg:221.63ms step:1821/6710 train_time:403595ms step_avg:221.63ms step:1822/6710 train_time:403821ms step_avg:221.64ms step:1823/6710 train_time:404048ms step_avg:221.64ms step:1824/6710 train_time:404273ms step_avg:221.64ms step:1825/6710 train_time:404501ms step_avg:221.64ms step:1826/6710 train_time:404726ms step_avg:221.65ms step:1827/6710 train_time:404952ms step_avg:221.65ms step:1828/6710 train_time:405180ms step_avg:221.65ms step:1829/6710 train_time:405405ms step_avg:221.65ms step:1830/6710 train_time:405633ms step_avg:221.66ms step:1831/6710 train_time:405858ms step_avg:221.66ms step:1832/6710 train_time:406084ms step_avg:221.66ms step:1833/6710 train_time:406310ms step_avg:221.66ms step:1834/6710 train_time:406536ms step_avg:221.67ms step:1835/6710 train_time:406764ms step_avg:221.67ms step:1836/6710 train_time:406990ms step_avg:221.67ms step:1837/6710 train_time:407217ms step_avg:221.68ms step:1838/6710 train_time:407443ms step_avg:221.68ms step:1839/6710 train_time:407670ms step_avg:221.68ms step:1840/6710 train_time:407898ms step_avg:221.68ms step:1841/6710 train_time:408124ms step_avg:221.69ms step:1842/6710 train_time:408350ms step_avg:221.69ms step:1843/6710 train_time:408578ms step_avg:221.69ms step:1844/6710 train_time:408804ms step_avg:221.69ms step:1845/6710 train_time:409029ms step_avg:221.70ms step:1846/6710 
train_time:409255ms step_avg:221.70ms step:1847/6710 train_time:409483ms step_avg:221.70ms step:1848/6710 train_time:409709ms step_avg:221.70ms step:1849/6710 train_time:409936ms step_avg:221.71ms step:1850/6710 train_time:410162ms step_avg:221.71ms step:1851/6710 train_time:410388ms step_avg:221.71ms step:1852/6710 train_time:410614ms step_avg:221.71ms step:1853/6710 train_time:410840ms step_avg:221.72ms step:1854/6710 train_time:411066ms step_avg:221.72ms step:1855/6710 train_time:411292ms step_avg:221.72ms step:1856/6710 train_time:411518ms step_avg:221.72ms step:1857/6710 train_time:411744ms step_avg:221.73ms step:1858/6710 train_time:411971ms step_avg:221.73ms step:1859/6710 train_time:412198ms step_avg:221.73ms step:1860/6710 train_time:412423ms step_avg:221.73ms step:1861/6710 train_time:412649ms step_avg:221.74ms step:1862/6710 train_time:412875ms step_avg:221.74ms step:1863/6710 train_time:413102ms step_avg:221.74ms step:1864/6710 train_time:413326ms step_avg:221.74ms step:1865/6710 train_time:413553ms step_avg:221.74ms step:1866/6710 train_time:413780ms step_avg:221.75ms step:1867/6710 train_time:414006ms step_avg:221.75ms step:1868/6710 train_time:414232ms step_avg:221.75ms step:1869/6710 train_time:414458ms step_avg:221.75ms step:1870/6710 train_time:414683ms step_avg:221.76ms step:1871/6710 train_time:414910ms step_avg:221.76ms step:1872/6710 train_time:415136ms step_avg:221.76ms step:1873/6710 train_time:415362ms step_avg:221.76ms step:1874/6710 train_time:415586ms step_avg:221.76ms step:1875/6710 train_time:415812ms step_avg:221.77ms step:1875/6710 val_loss:3.276423 train_time:415990ms step_avg:221.86ms Parameter containing: tensor([1.0000, 1.0000, 0.4149, 1.0000, 0.6924, 1.0000, 0.5848, 1.0000], device='cuda:0', requires_grad=True) 0 [5.262783050537109, 4.262781143188477] 1 [0.6112073659896851, 4.184235572814941] 2 [0.8838950395584106, 3.407409191131592] 3 [0.6606908440589905, 2.6169395446777344] 4 [0.30422574281692505, 1.9224286079406738] 5 
[0.8276634216308594, 3.028897523880005] 6 [0.5315368175506592, 2.7013866901397705] 7 [0.8510998487472534, 4.2756028175354] 8 [0.3935028910636902, 1.740257740020752] 9 [0.5277939438819885, 2.407907485961914] 10 [0.6639182567596436, 2.5776214599609375] 11 [0.44376981258392334, 2.5472829341888428] 12 [1.068073034286499, 4.333664894104004] 13 [1.0949108600616455, 2.8335983753204346] 14 [0.9737492203712463, 2.1018927097320557] 15 [0.7793194055557251, 1.7758796215057373] 0 [9.508862495422363, 20.282073974609375, 20.983169555664062] 1 [25.015766143798828, 20.577836990356445, 50.05152130126953] 2 [62.607479095458984, 18.33133888244629, 23.86572265625] 3 [53.86604309082031, 21.536518096923828, 27.925785064697266] 4 [24.583717346191406, 20.321683883666992, 18.40437126159668] 5 [41.15494155883789, 18.73263931274414, 28.671356201171875] 6 [37.14326858520508, 21.097274780273438, 21.650510787963867] 7 [53.998661041259766, 0.0, 38.84406661987305] 8 [31.155317306518555, 23.722091674804688, 35.46706771850586] 9 [52.86915588378906, 20.15357208251953, 28.266828536987305] 10 [70.66366577148438, 17.27853012084961, 25.445838928222656] 11 [52.287288665771484, 24.655086517333984, 14.198713302612305] 12 [82.06964111328125, 16.887693405151367, 17.872983932495117] 13 [109.39286804199219, 17.44381332397461, 24.233617782592773] 14 [120.49622344970703, 20.980514526367188, 35.163047790527344] 15 [108.20516204833984, 63.53549575805664, 91.51300048828125] step:1876/6710 train_time:416039ms step_avg:221.77ms step:1877/6710 train_time:416262ms step_avg:221.77ms step:1878/6710 train_time:416493ms step_avg:221.77ms step:1879/6710 train_time:416719ms step_avg:221.78ms step:1880/6710 train_time:416945ms step_avg:221.78ms step:1881/6710 train_time:417172ms step_avg:221.78ms step:1882/6710 train_time:417400ms step_avg:221.79ms step:1883/6710 train_time:417625ms step_avg:221.79ms step:1884/6710 train_time:417848ms step_avg:221.79ms step:1885/6710 train_time:418075ms step_avg:221.79ms step:1886/6710 
train_time:418303ms step_avg:221.79ms step:1887/6710 train_time:418530ms step_avg:221.80ms step:1888/6710 train_time:418756ms step_avg:221.80ms step:1889/6710 train_time:418982ms step_avg:221.80ms step:1890/6710 train_time:419207ms step_avg:221.80ms step:1891/6710 train_time:419434ms step_avg:221.81ms step:1892/6710 train_time:419661ms step_avg:221.81ms step:1893/6710 train_time:419886ms step_avg:221.81ms step:1894/6710 train_time:420113ms step_avg:221.81ms step:1895/6710 train_time:420340ms step_avg:221.82ms step:1896/6710 train_time:420566ms step_avg:221.82ms step:1897/6710 train_time:420789ms step_avg:221.82ms step:1898/6710 train_time:421015ms step_avg:221.82ms step:1899/6710 train_time:421242ms step_avg:221.82ms step:1900/6710 train_time:421470ms step_avg:221.83ms step:1901/6710 train_time:421695ms step_avg:221.83ms step:1902/6710 train_time:421922ms step_avg:221.83ms step:1903/6710 train_time:422148ms step_avg:221.83ms step:1904/6710 train_time:422372ms step_avg:221.83ms step:1905/6710 train_time:422600ms step_avg:221.84ms step:1906/6710 train_time:422826ms step_avg:221.84ms step:1907/6710 train_time:423050ms step_avg:221.84ms step:1908/6710 train_time:423278ms step_avg:221.84ms step:1909/6710 train_time:423505ms step_avg:221.85ms step:1910/6710 train_time:423730ms step_avg:221.85ms step:1911/6710 train_time:423955ms step_avg:221.85ms step:1912/6710 train_time:424181ms step_avg:221.85ms step:1913/6710 train_time:424408ms step_avg:221.85ms step:1914/6710 train_time:424634ms step_avg:221.86ms step:1915/6710 train_time:424860ms step_avg:221.86ms step:1916/6710 train_time:425086ms step_avg:221.86ms step:1917/6710 train_time:425312ms step_avg:221.86ms step:1918/6710 train_time:425539ms step_avg:221.87ms step:1919/6710 train_time:425766ms step_avg:221.87ms step:1920/6710 train_time:425991ms step_avg:221.87ms step:1921/6710 train_time:426216ms step_avg:221.87ms step:1922/6710 train_time:426443ms step_avg:221.87ms step:1923/6710 train_time:426669ms step_avg:221.88ms 
step:1924/6710 train_time:426896ms step_avg:221.88ms step:1925/6710 train_time:427123ms step_avg:221.88ms step:1926/6710 train_time:427349ms step_avg:221.88ms step:1927/6710 train_time:427574ms step_avg:221.89ms step:1928/6710 train_time:427801ms step_avg:221.89ms step:1929/6710 train_time:428027ms step_avg:221.89ms step:1930/6710 train_time:428251ms step_avg:221.89ms step:1931/6710 train_time:428477ms step_avg:221.89ms step:1932/6710 train_time:428705ms step_avg:221.90ms step:1933/6710 train_time:428929ms step_avg:221.90ms step:1934/6710 train_time:429154ms step_avg:221.90ms step:1935/6710 train_time:429380ms step_avg:221.90ms step:1936/6710 train_time:429606ms step_avg:221.90ms step:1937/6710 train_time:429833ms step_avg:221.91ms step:1938/6710 train_time:430059ms step_avg:221.91ms step:1939/6710 train_time:430285ms step_avg:221.91ms step:1940/6710 train_time:430509ms step_avg:221.91ms step:1941/6710 train_time:430735ms step_avg:221.91ms step:1942/6710 train_time:430962ms step_avg:221.92ms step:1943/6710 train_time:431189ms step_avg:221.92ms step:1944/6710 train_time:431414ms step_avg:221.92ms step:1945/6710 train_time:431641ms step_avg:221.92ms step:1946/6710 train_time:431868ms step_avg:221.93ms step:1947/6710 train_time:432093ms step_avg:221.93ms step:1948/6710 train_time:432319ms step_avg:221.93ms step:1949/6710 train_time:432547ms step_avg:221.93ms step:1950/6710 train_time:432773ms step_avg:221.93ms step:1951/6710 train_time:432998ms step_avg:221.94ms step:1952/6710 train_time:433226ms step_avg:221.94ms step:1953/6710 train_time:433452ms step_avg:221.94ms step:1954/6710 train_time:433680ms step_avg:221.94ms step:1955/6710 train_time:433907ms step_avg:221.95ms step:1956/6710 train_time:434133ms step_avg:221.95ms step:1957/6710 train_time:434359ms step_avg:221.95ms step:1958/6710 train_time:434585ms step_avg:221.95ms step:1959/6710 train_time:434811ms step_avg:221.96ms step:1960/6710 train_time:435036ms step_avg:221.96ms step:1961/6710 train_time:435263ms 
step_avg:221.96ms step:1962/6710 train_time:435488ms step_avg:221.96ms step:1963/6710 train_time:435714ms step_avg:221.96ms step:1964/6710 train_time:435941ms step_avg:221.97ms step:1965/6710 train_time:436167ms step_avg:221.97ms step:1966/6710 train_time:436393ms step_avg:221.97ms step:1967/6710 train_time:436619ms step_avg:221.97ms step:1968/6710 train_time:436846ms step_avg:221.97ms step:1969/6710 train_time:437070ms step_avg:221.98ms step:1970/6710 train_time:437296ms step_avg:221.98ms step:1971/6710 train_time:437524ms step_avg:221.98ms step:1972/6710 train_time:437748ms step_avg:221.98ms step:1973/6710 train_time:437974ms step_avg:221.98ms step:1974/6710 train_time:438200ms step_avg:221.99ms step:1975/6710 train_time:438427ms step_avg:221.99ms step:1976/6710 train_time:438652ms step_avg:221.99ms step:1977/6710 train_time:438877ms step_avg:221.99ms step:1978/6710 train_time:439104ms step_avg:221.99ms step:1979/6710 train_time:439331ms step_avg:222.00ms step:1980/6710 train_time:439555ms step_avg:222.00ms step:1981/6710 train_time:439782ms step_avg:222.00ms step:1982/6710 train_time:440009ms step_avg:222.00ms step:1983/6710 train_time:440234ms step_avg:222.00ms step:1984/6710 train_time:440460ms step_avg:222.01ms step:1985/6710 train_time:440686ms step_avg:222.01ms step:1986/6710 train_time:440911ms step_avg:222.01ms step:1987/6710 train_time:441136ms step_avg:222.01ms step:1988/6710 train_time:441362ms step_avg:222.01ms step:1989/6710 train_time:441589ms step_avg:222.02ms step:1990/6710 train_time:441816ms step_avg:222.02ms step:1991/6710 train_time:442044ms step_avg:222.02ms step:1992/6710 train_time:442269ms step_avg:222.02ms step:1993/6710 train_time:442496ms step_avg:222.03ms step:1994/6710 train_time:442723ms step_avg:222.03ms step:1995/6710 train_time:442949ms step_avg:222.03ms step:1996/6710 train_time:443176ms step_avg:222.03ms step:1997/6710 train_time:443402ms step_avg:222.03ms step:1998/6710 train_time:443628ms step_avg:222.04ms step:1999/6710 
train_time:443853ms step_avg:222.04ms step:2000/6710 train_time:444081ms step_avg:222.04ms step:2000/6710 val_loss:3.254454 train_time:444259ms step_avg:222.13ms Parameter containing: tensor([1.0000, 1.0000, 0.4084, 1.0000, 0.6819, 1.0000, 0.5671, 1.0000], device='cuda:0', requires_grad=True) 0 [5.493679046630859, 4.493677139282227] 1 [0.6089092493057251, 4.428009033203125] 2 [0.8809236288070679, 3.579231023788452] 3 [0.6628202795982361, 2.770965099334717] 4 [0.30599382519721985, 2.021618127822876] 5 [0.8202694654464722, 3.1740593910217285] 6 [0.532674252986908, 2.804563045501709] 7 [0.8300620317459106, 4.48565673828125] 8 [0.3904864192008972, 1.7703320980072021] 9 [0.5215399861335754, 2.47442626953125] 10 [0.6634827256202698, 2.6793315410614014] 11 [0.4411710798740387, 2.6345911026000977] 12 [1.06203293800354, 4.515466690063477] 13 [1.0977163314819336, 2.9315996170043945] 14 [0.9741932153701782, 2.142749071121216] 15 [0.7823517918586731, 1.7779202461242676] 0 [9.972466468811035, 21.214834213256836, 21.896055221557617] 1 [26.065900802612305, 21.6246280670166, 53.10434341430664] 2 [65.6492919921875, 19.283857345581055, 24.807205200195312] 3 [56.55989456176758, 22.850994110107422, 29.11052131652832] 4 [25.88116455078125, 21.34423828125, 19.724699020385742] 5 [43.00420379638672, 19.859634399414062, 30.636703491210938] 6 [39.1717643737793, 22.46973419189453, 22.83962631225586] 7 [55.613956451416016, 0.0, 40.446048736572266] 8 [31.975784301757812, 24.987154006958008, 36.939796447753906] 9 [53.8613395690918, 21.26601219177246, 29.72886085510254] 10 [72.81573486328125, 18.501190185546875, 26.848711013793945] 11 [53.818756103515625, 25.621723175048828, 14.73881721496582] 12 [84.27542877197266, 18.069883346557617, 18.32025146484375] 13 [113.0115737915039, 18.302148818969727, 24.812175750732422] 14 [124.39861297607422, 21.847515106201172, 36.32484817504883] 15 [112.20740509033203, 66.73453521728516, 95.34567260742188] step:2001/6710 train_time:444307ms step_avg:222.04ms 
step:2002/6710 train_time:444533ms step_avg:222.04ms step:2003/6710 train_time:444765ms step_avg:222.05ms step:2004/6710 train_time:444990ms step_avg:222.05ms step:2005/6710 train_time:445217ms step_avg:222.05ms step:2006/6710 train_time:445445ms step_avg:222.06ms step:2007/6710 train_time:445672ms step_avg:222.06ms step:2008/6710 train_time:445900ms step_avg:222.06ms step:2009/6710 train_time:446124ms step_avg:222.06ms step:2010/6710 train_time:446353ms step_avg:222.07ms step:2011/6710 train_time:446581ms step_avg:222.07ms step:2012/6710 train_time:446808ms step_avg:222.07ms step:2013/6710 train_time:447036ms step_avg:222.07ms step:2014/6710 train_time:447264ms step_avg:222.08ms step:2015/6710 train_time:447491ms step_avg:222.08ms step:2016/6710 train_time:447717ms step_avg:222.08ms step:2017/6710 train_time:447944ms step_avg:222.08ms step:2018/6710 train_time:448173ms step_avg:222.09ms step:2019/6710 train_time:448400ms step_avg:222.09ms step:2020/6710 train_time:448626ms step_avg:222.09ms step:2021/6710 train_time:448854ms step_avg:222.09ms step:2022/6710 train_time:449080ms step_avg:222.10ms step:2023/6710 train_time:449305ms step_avg:222.10ms step:2024/6710 train_time:449532ms step_avg:222.10ms step:2025/6710 train_time:449761ms step_avg:222.10ms step:2026/6710 train_time:449987ms step_avg:222.11ms step:2027/6710 train_time:450214ms step_avg:222.11ms step:2028/6710 train_time:450441ms step_avg:222.11ms step:2029/6710 train_time:450667ms step_avg:222.11ms step:2030/6710 train_time:450896ms step_avg:222.12ms step:2031/6710 train_time:451121ms step_avg:222.12ms step:2032/6710 train_time:451348ms step_avg:222.12ms step:2033/6710 train_time:451576ms step_avg:222.12ms step:2034/6710 train_time:451802ms step_avg:222.13ms step:2035/6710 train_time:452029ms step_avg:222.13ms step:2036/6710 train_time:452255ms step_avg:222.13ms step:2037/6710 train_time:452484ms step_avg:222.13ms step:2038/6710 train_time:452709ms step_avg:222.13ms step:2039/6710 train_time:452936ms 
step_avg:222.14ms step:2040/6710 train_time:453163ms step_avg:222.14ms step:2041/6710 train_time:453389ms step_avg:222.14ms step:2042/6710 train_time:453616ms step_avg:222.14ms step:2043/6710 train_time:453842ms step_avg:222.15ms step:2044/6710 train_time:454068ms step_avg:222.15ms step:2045/6710 train_time:454296ms step_avg:222.15ms step:2046/6710 train_time:454522ms step_avg:222.15ms step:2047/6710 train_time:454748ms step_avg:222.15ms step:2048/6710 train_time:454976ms step_avg:222.16ms step:2049/6710 train_time:455205ms step_avg:222.16ms step:2050/6710 train_time:455432ms step_avg:222.16ms step:2051/6710 train_time:455658ms step_avg:222.16ms step:2052/6710 train_time:455886ms step_avg:222.17ms step:2053/6710 train_time:456113ms step_avg:222.17ms step:2054/6710 train_time:456340ms step_avg:222.17ms step:2055/6710 train_time:456565ms step_avg:222.17ms step:2056/6710 train_time:456791ms step_avg:222.17ms step:2057/6710 train_time:457019ms step_avg:222.18ms step:2058/6710 train_time:457245ms step_avg:222.18ms step:2059/6710 train_time:457472ms step_avg:222.18ms step:2060/6710 train_time:457698ms step_avg:222.18ms step:2061/6710 train_time:457924ms step_avg:222.19ms step:2062/6710 train_time:458152ms step_avg:222.19ms step:2063/6710 train_time:458380ms step_avg:222.19ms step:2064/6710 train_time:458606ms step_avg:222.19ms step:2065/6710 train_time:458832ms step_avg:222.19ms step:2066/6710 train_time:459059ms step_avg:222.20ms step:2067/6710 train_time:459286ms step_avg:222.20ms step:2068/6710 train_time:459512ms step_avg:222.20ms step:2069/6710 train_time:459740ms step_avg:222.20ms step:2070/6710 train_time:459967ms step_avg:222.21ms step:2071/6710 train_time:460192ms step_avg:222.21ms step:2072/6710 train_time:460419ms step_avg:222.21ms step:2073/6710 train_time:460644ms step_avg:222.21ms step:2074/6710 train_time:460872ms step_avg:222.21ms step:2075/6710 train_time:461100ms step_avg:222.22ms step:2076/6710 train_time:461325ms step_avg:222.22ms step:2077/6710 
train_time:461551ms step_avg:222.22ms step:2078/6710 train_time:461780ms step_avg:222.22ms step:2079/6710 train_time:462006ms step_avg:222.22ms step:2080/6710 train_time:462232ms step_avg:222.23ms step:2081/6710 train_time:462460ms step_avg:222.23ms step:2082/6710 train_time:462686ms step_avg:222.23ms step:2083/6710 train_time:462913ms step_avg:222.23ms step:2084/6710 train_time:463141ms step_avg:222.24ms step:2085/6710 train_time:463366ms step_avg:222.24ms step:2086/6710 train_time:463592ms step_avg:222.24ms step:2087/6710 train_time:463819ms step_avg:222.24ms step:2088/6710 train_time:464047ms step_avg:222.24ms step:2089/6710 train_time:464274ms step_avg:222.25ms step:2090/6710 train_time:464502ms step_avg:222.25ms step:2091/6710 train_time:464727ms step_avg:222.25ms step:2092/6710 train_time:464953ms step_avg:222.25ms step:2093/6710 train_time:465181ms step_avg:222.26ms step:2094/6710 train_time:465407ms step_avg:222.26ms step:2095/6710 train_time:465634ms step_avg:222.26ms step:2096/6710 train_time:465860ms step_avg:222.26ms step:2097/6710 train_time:466087ms step_avg:222.26ms step:2098/6710 train_time:466314ms step_avg:222.27ms step:2099/6710 train_time:466542ms step_avg:222.27ms step:2100/6710 train_time:466767ms step_avg:222.27ms step:2101/6710 train_time:466993ms step_avg:222.27ms step:2102/6710 train_time:467220ms step_avg:222.27ms step:2103/6710 train_time:467446ms step_avg:222.28ms step:2104/6710 train_time:467674ms step_avg:222.28ms step:2105/6710 train_time:467901ms step_avg:222.28ms step:2106/6710 train_time:468127ms step_avg:222.28ms step:2107/6710 train_time:468354ms step_avg:222.28ms step:2108/6710 train_time:468583ms step_avg:222.29ms step:2109/6710 train_time:468808ms step_avg:222.29ms step:2110/6710 train_time:469035ms step_avg:222.29ms step:2111/6710 train_time:469262ms step_avg:222.29ms step:2112/6710 train_time:469488ms step_avg:222.30ms step:2113/6710 train_time:469716ms step_avg:222.30ms step:2114/6710 train_time:469941ms step_avg:222.30ms 
step:2115/6710 train_time:470166ms step_avg:222.30ms step:2116/6710 train_time:470393ms step_avg:222.30ms step:2117/6710 train_time:470621ms step_avg:222.31ms step:2118/6710 train_time:470847ms step_avg:222.31ms step:2119/6710 train_time:471073ms step_avg:222.31ms step:2120/6710 train_time:471301ms step_avg:222.31ms step:2121/6710 train_time:471526ms step_avg:222.31ms step:2122/6710 train_time:471754ms step_avg:222.32ms step:2123/6710 train_time:471980ms step_avg:222.32ms step:2124/6710 train_time:472205ms step_avg:222.32ms step:2125/6710 train_time:472431ms step_avg:222.32ms step:2125/6710 val_loss:3.241350 train_time:472610ms step_avg:222.40ms Parameter containing: tensor([1.0000, 1.0000, 0.4122, 1.0000, 0.6797, 1.0000, 0.5749, 1.0000], device='cuda:0', requires_grad=True) 0 [5.701932430267334, 4.701930522918701] 1 [0.5993094444274902, 4.659180641174316] 2 [0.8690930604934692, 3.7327961921691895] 3 [0.6596499681472778, 2.930015802383423] 4 [0.3117554485797882, 2.116508960723877] 5 [0.8184296488761902, 3.298748254776001] 6 [0.5214141011238098, 2.8712193965911865] 7 [0.8381954431533813, 4.668008804321289] 8 [0.3978913724422455, 1.7780437469482422] 9 [0.5199402570724487, 2.502401828765869] 10 [0.6657601594924927, 2.7317357063293457] 11 [0.43924999237060547, 2.7086470127105713] 12 [1.0519959926605225, 4.720277309417725] 13 [1.096740484237671, 3.006510019302368] 14 [0.9761243462562561, 2.116412401199341] 15 [0.7824856042861938, 1.7020667791366577] 0 [10.390246391296387, 22.085346221923828, 23.010313034057617] 1 [26.86855125427246, 22.552494049072266, 54.80093765258789] 2 [66.9200668334961, 20.150283813476562, 25.70220184326172] 3 [57.79960250854492, 24.11147117614746, 29.779939651489258] 4 [27.07605743408203, 22.258474349975586, 20.447669982910156] 5 [44.654876708984375, 20.808692932128906, 32.0528678894043] 6 [39.856651306152344, 23.66878318786621, 23.894977569580078] 7 [57.7916374206543, 0.0, 41.98939514160156] 8 [33.739498138427734, 26.246755599975586, 
38.98984146118164] 9 [56.2891960144043, 22.19251823425293, 30.989126205444336] 10 [75.97063446044922, 19.665966033935547, 28.07529640197754] 11 [55.87693786621094, 27.093353271484375, 15.610443115234375] 12 [87.29277038574219, 19.06072235107422, 19.2215518951416] 13 [117.35682678222656, 18.820558547973633, 25.7702693939209] 14 [129.345703125, 22.724611282348633, 37.686279296875] 15 [116.76273345947266, 70.98279571533203, 100.63632202148438] step:2126/6710 train_time:472660ms step_avg:222.32ms step:2127/6710 train_time:472881ms step_avg:222.32ms step:2128/6710 train_time:473112ms step_avg:222.33ms step:2129/6710 train_time:473337ms step_avg:222.33ms step:2130/6710 train_time:473563ms step_avg:222.33ms step:2131/6710 train_time:473790ms step_avg:222.33ms step:2132/6710 train_time:474018ms step_avg:222.33ms step:2133/6710 train_time:474244ms step_avg:222.34ms step:2134/6710 train_time:474469ms step_avg:222.34ms step:2135/6710 train_time:474698ms step_avg:222.34ms step:2136/6710 train_time:474924ms step_avg:222.34ms step:2137/6710 train_time:475151ms step_avg:222.34ms step:2138/6710 train_time:475379ms step_avg:222.35ms step:2139/6710 train_time:475606ms step_avg:222.35ms step:2140/6710 train_time:475833ms step_avg:222.35ms step:2141/6710 train_time:476061ms step_avg:222.35ms step:2142/6710 train_time:476287ms step_avg:222.36ms step:2143/6710 train_time:476512ms step_avg:222.36ms step:2144/6710 train_time:476740ms step_avg:222.36ms step:2145/6710 train_time:476966ms step_avg:222.36ms step:2146/6710 train_time:477193ms step_avg:222.36ms step:2147/6710 train_time:477420ms step_avg:222.37ms step:2148/6710 train_time:477646ms step_avg:222.37ms step:2149/6710 train_time:477873ms step_avg:222.37ms step:2150/6710 train_time:478100ms step_avg:222.37ms step:2151/6710 train_time:478325ms step_avg:222.37ms step:2152/6710 train_time:478552ms step_avg:222.38ms step:2153/6710 train_time:478780ms step_avg:222.38ms step:2154/6710 train_time:479005ms step_avg:222.38ms step:2155/6710 
train_time:479232ms step_avg:222.38ms step:2156/6710 train_time:479459ms step_avg:222.38ms step:2157/6710 train_time:479685ms step_avg:222.39ms step:2158/6710 train_time:479910ms step_avg:222.39ms step:2159/6710 train_time:480137ms step_avg:222.39ms step:2160/6710 train_time:480364ms step_avg:222.39ms step:2161/6710 train_time:480591ms step_avg:222.39ms step:2162/6710 train_time:480818ms step_avg:222.40ms step:2163/6710 train_time:481044ms step_avg:222.40ms step:2164/6710 train_time:481270ms step_avg:222.40ms step:2165/6710 train_time:481498ms step_avg:222.40ms step:2166/6710 train_time:481725ms step_avg:222.40ms step:2167/6710 train_time:481953ms step_avg:222.41ms step:2168/6710 train_time:482182ms step_avg:222.41ms step:2169/6710 train_time:482407ms step_avg:222.41ms step:2170/6710 train_time:482637ms step_avg:222.41ms step:2171/6710 train_time:482864ms step_avg:222.42ms step:2172/6710 train_time:483091ms step_avg:222.42ms step:2173/6710 train_time:483318ms step_avg:222.42ms step:2174/6710 train_time:483543ms step_avg:222.42ms step:2175/6710 train_time:483770ms step_avg:222.42ms step:2176/6710 train_time:483998ms step_avg:222.43ms step:2177/6710 train_time:484224ms step_avg:222.43ms step:2178/6710 train_time:484449ms step_avg:222.43ms step:2179/6710 train_time:484677ms step_avg:222.43ms step:2180/6710 train_time:484903ms step_avg:222.43ms step:2181/6710 train_time:485129ms step_avg:222.43ms step:2182/6710 train_time:485357ms step_avg:222.44ms step:2183/6710 train_time:485583ms step_avg:222.44ms step:2184/6710 train_time:485811ms step_avg:222.44ms step:2185/6710 train_time:486038ms step_avg:222.44ms step:2186/6710 train_time:486264ms step_avg:222.44ms step:2187/6710 train_time:486489ms step_avg:222.45ms step:2188/6710 train_time:486716ms step_avg:222.45ms step:2189/6710 train_time:486944ms step_avg:222.45ms step:2190/6710 train_time:487171ms step_avg:222.45ms step:2191/6710 train_time:487398ms step_avg:222.45ms step:2192/6710 train_time:487623ms step_avg:222.46ms 
step:2193/6710 train_time:487850ms step_avg:222.46ms step:2194/6710 train_time:488078ms step_avg:222.46ms step:2195/6710 train_time:488305ms step_avg:222.46ms step:2196/6710 train_time:488531ms step_avg:222.46ms step:2197/6710 train_time:488760ms step_avg:222.47ms step:2198/6710 train_time:488986ms step_avg:222.47ms step:2199/6710 train_time:489211ms step_avg:222.47ms step:2200/6710 train_time:489439ms step_avg:222.47ms step:2201/6710 train_time:489665ms step_avg:222.47ms step:2202/6710 train_time:489892ms step_avg:222.48ms step:2203/6710 train_time:490120ms step_avg:222.48ms step:2204/6710 train_time:490347ms step_avg:222.48ms step:2205/6710 train_time:490573ms step_avg:222.48ms step:2206/6710 train_time:490801ms step_avg:222.48ms step:2207/6710 train_time:491028ms step_avg:222.49ms step:2208/6710 train_time:491254ms step_avg:222.49ms step:2209/6710 train_time:491482ms step_avg:222.49ms step:2210/6710 train_time:491709ms step_avg:222.49ms step:2211/6710 train_time:491936ms step_avg:222.49ms step:2212/6710 train_time:492162ms step_avg:222.50ms step:2213/6710 train_time:492388ms step_avg:222.50ms step:2214/6710 train_time:492614ms step_avg:222.50ms step:2215/6710 train_time:492842ms step_avg:222.50ms step:2216/6710 train_time:493068ms step_avg:222.50ms step:2217/6710 train_time:493297ms step_avg:222.51ms step:2218/6710 train_time:493523ms step_avg:222.51ms step:2219/6710 train_time:493750ms step_avg:222.51ms step:2220/6710 train_time:493978ms step_avg:222.51ms step:2221/6710 train_time:494204ms step_avg:222.51ms step:2222/6710 train_time:494431ms step_avg:222.52ms step:2223/6710 train_time:494659ms step_avg:222.52ms step:2224/6710 train_time:494886ms step_avg:222.52ms step:2225/6710 train_time:495110ms step_avg:222.52ms step:2226/6710 train_time:495340ms step_avg:222.52ms step:2227/6710 train_time:495565ms step_avg:222.53ms step:2228/6710 train_time:495791ms step_avg:222.53ms step:2229/6710 train_time:496018ms step_avg:222.53ms step:2230/6710 train_time:496245ms 
step_avg:222.53ms step:2231/6710 train_time:496472ms step_avg:222.53ms step:2232/6710 train_time:496701ms step_avg:222.54ms step:2233/6710 train_time:496927ms step_avg:222.54ms step:2234/6710 train_time:497154ms step_avg:222.54ms step:2235/6710 train_time:497382ms step_avg:222.54ms step:2236/6710 train_time:497608ms step_avg:222.54ms step:2237/6710 train_time:497836ms step_avg:222.55ms step:2238/6710 train_time:498065ms step_avg:222.55ms step:2239/6710 train_time:498292ms step_avg:222.55ms step:2240/6710 train_time:498520ms step_avg:222.55ms step:2241/6710 train_time:498746ms step_avg:222.55ms step:2242/6710 train_time:498973ms step_avg:222.56ms step:2243/6710 train_time:499200ms step_avg:222.56ms step:2244/6710 train_time:499425ms step_avg:222.56ms step:2245/6710 train_time:499651ms step_avg:222.56ms step:2246/6710 train_time:499879ms step_avg:222.56ms step:2247/6710 train_time:500104ms step_avg:222.57ms step:2248/6710 train_time:500330ms step_avg:222.57ms step:2249/6710 train_time:500557ms step_avg:222.57ms step:2250/6710 train_time:500782ms step_avg:222.57ms step:2250/6710 val_loss:3.231741 train_time:500962ms step_avg:222.65ms Parameter containing: tensor([1.0000, 1.0000, 0.4164, 1.0000, 0.6689, 1.0000, 0.5586, 1.0000], device='cuda:0', requires_grad=True) 0 [5.917022228240967, 4.917020320892334] 1 [0.590139627456665, 4.867969036102295] 2 [0.8648361563682556, 3.875638008117676] 3 [0.6748530864715576, 3.04642653465271] 4 [0.31170397996902466, 2.176778793334961] 5 [0.8149224519729614, 3.425365686416626] 6 [0.5214380621910095, 2.9603216648101807] 7 [0.8375823497772217, 4.864132881164551] 8 [0.4038662314414978, 1.7838599681854248] 9 [0.5098934173583984, 2.556083917617798] 10 [0.6595945954322815, 2.808319330215454] 11 [0.43722206354141235, 2.8004026412963867] 12 [1.040493130683899, 4.948275089263916] 13 [1.094214916229248, 3.1252987384796143] 14 [0.9761959314346313, 2.135460138320923] 15 [0.783202588558197, 1.679872989654541] 0 [10.820076942443848, 
22.890329360961914, 24.301837921142578] 1 [27.668678283691406, 23.412675857543945, 57.10967254638672] 2 [69.07161712646484, 20.902847290039062, 27.1318302154541] 3 [61.10808181762695, 25.377775192260742, 31.4161434173584] 4 [28.545167922973633, 23.226913452148438, 21.348310470581055] 5 [46.49768829345703, 21.93979263305664, 33.29281234741211] 6 [41.421958923339844, 24.713748931884766, 24.72878074645996] 7 [59.85765075683594, 0.0, 43.22897720336914] 8 [35.33561325073242, 27.141281127929688, 40.819244384765625] 9 [56.91533279418945, 23.174034118652344, 32.547264099121094] 10 [77.11314392089844, 20.839340209960938, 29.531208038330078] 11 [57.268638610839844, 28.22524070739746, 16.23538589477539] 12 [89.08341217041016, 20.077102661132812, 19.974035263061523] 13 [120.26737976074219, 19.57748031616211, 26.790924072265625] 14 [132.96786499023438, 23.809907913208008, 39.993186950683594] 15 [120.82491302490234, 74.72376251220703, 110.45025634765625] step:2251/6710 train_time:501012ms step_avg:222.57ms step:2252/6710 train_time:501233ms step_avg:222.57ms step:2253/6710 train_time:501465ms step_avg:222.58ms step:2254/6710 train_time:501690ms step_avg:222.58ms step:2255/6710 train_time:501916ms step_avg:222.58ms step:2256/6710 train_time:502143ms step_avg:222.58ms step:2257/6710 train_time:502372ms step_avg:222.58ms step:2258/6710 train_time:502599ms step_avg:222.59ms step:2259/6710 train_time:502824ms step_avg:222.59ms step:2260/6710 train_time:503051ms step_avg:222.59ms step:2261/6710 train_time:503278ms step_avg:222.59ms step:2262/6710 train_time:503504ms step_avg:222.59ms step:2263/6710 train_time:503730ms step_avg:222.59ms step:2264/6710 train_time:503956ms step_avg:222.60ms step:2265/6710 train_time:504183ms step_avg:222.60ms step:2266/6710 train_time:504411ms step_avg:222.60ms step:2267/6710 train_time:504639ms step_avg:222.60ms step:2268/6710 train_time:504866ms step_avg:222.60ms step:2269/6710 train_time:505093ms step_avg:222.61ms step:2270/6710 train_time:505320ms 
step_avg:222.61ms step:2271/6710 train_time:505547ms step_avg:222.61ms step:2272/6710 train_time:505774ms step_avg:222.61ms step:2273/6710 train_time:506000ms step_avg:222.61ms step:2274/6710 train_time:506225ms step_avg:222.61ms step:2275/6710 train_time:506453ms step_avg:222.62ms step:2276/6710 train_time:506679ms step_avg:222.62ms step:2277/6710 train_time:506905ms step_avg:222.62ms step:2278/6710 train_time:507133ms step_avg:222.62ms step:2279/6710 train_time:507359ms step_avg:222.62ms step:2280/6710 train_time:507584ms step_avg:222.62ms step:2281/6710 train_time:507812ms step_avg:222.63ms step:2282/6710 train_time:508039ms step_avg:222.63ms step:2283/6710 train_time:508267ms step_avg:222.63ms step:2284/6710 train_time:508495ms step_avg:222.63ms step:2285/6710 train_time:508722ms step_avg:222.64ms step:2286/6710 train_time:508949ms step_avg:222.64ms step:2287/6710 train_time:509176ms step_avg:222.64ms step:2288/6710 train_time:509402ms step_avg:222.64ms step:2289/6710 train_time:509629ms step_avg:222.64ms step:2290/6710 train_time:509857ms step_avg:222.65ms step:2291/6710 train_time:510082ms step_avg:222.65ms step:2292/6710 train_time:510308ms step_avg:222.65ms step:2293/6710 train_time:510537ms step_avg:222.65ms step:2294/6710 train_time:510762ms step_avg:222.65ms step:2295/6710 train_time:510988ms step_avg:222.65ms step:2296/6710 train_time:511217ms step_avg:222.66ms step:2297/6710 train_time:511443ms step_avg:222.66ms step:2298/6710 train_time:511672ms step_avg:222.66ms step:2299/6710 train_time:511898ms step_avg:222.66ms step:2300/6710 train_time:512124ms step_avg:222.66ms step:2301/6710 train_time:512351ms step_avg:222.66ms step:2302/6710 train_time:512578ms step_avg:222.67ms step:2303/6710 train_time:512804ms step_avg:222.67ms step:2304/6710 train_time:513031ms step_avg:222.67ms step:2305/6710 train_time:513258ms step_avg:222.67ms step:2306/6710 train_time:513485ms step_avg:222.67ms step:2307/6710 train_time:513714ms step_avg:222.68ms step:2308/6710 
train_time:513939ms step_avg:222.68ms step:2309/6710 train_time:514165ms step_avg:222.68ms step:2310/6710 train_time:514391ms step_avg:222.68ms step:2311/6710 train_time:514618ms step_avg:222.68ms step:2312/6710 train_time:514846ms step_avg:222.68ms step:2313/6710 train_time:515073ms step_avg:222.69ms step:2314/6710 train_time:515298ms step_avg:222.69ms step:2315/6710 train_time:515525ms step_avg:222.69ms step:2316/6710 train_time:515751ms step_avg:222.69ms step:2317/6710 train_time:515978ms step_avg:222.69ms step:2318/6710 train_time:516205ms step_avg:222.69ms step:2319/6710 train_time:516431ms step_avg:222.70ms step:2320/6710 train_time:516658ms step_avg:222.70ms step:2321/6710 train_time:516885ms step_avg:222.70ms step:2322/6710 train_time:517111ms step_avg:222.70ms step:2323/6710 train_time:517338ms step_avg:222.70ms step:2324/6710 train_time:517563ms step_avg:222.70ms step:2325/6710 train_time:517792ms step_avg:222.71ms step:2326/6710 train_time:518018ms step_avg:222.71ms step:2327/6710 train_time:518245ms step_avg:222.71ms step:2328/6710 train_time:518474ms step_avg:222.71ms step:2329/6710 train_time:518700ms step_avg:222.71ms step:2330/6710 train_time:518928ms step_avg:222.72ms step:2331/6710 train_time:519156ms step_avg:222.72ms step:2332/6710 train_time:519381ms step_avg:222.72ms step:2333/6710 train_time:519609ms step_avg:222.72ms step:2334/6710 train_time:519835ms step_avg:222.72ms step:2335/6710 train_time:520061ms step_avg:222.72ms step:2336/6710 train_time:520289ms step_avg:222.73ms step:2337/6710 train_time:520516ms step_avg:222.73ms step:2338/6710 train_time:520741ms step_avg:222.73ms step:2339/6710 train_time:520969ms step_avg:222.73ms step:2340/6710 train_time:521196ms step_avg:222.73ms step:2341/6710 train_time:521420ms step_avg:222.73ms step:2342/6710 train_time:521648ms step_avg:222.74ms step:2343/6710 train_time:521875ms step_avg:222.74ms step:2344/6710 train_time:522100ms step_avg:222.74ms step:2345/6710 train_time:522329ms step_avg:222.74ms 
step:2346/6710 train_time:522556ms step_avg:222.74ms step:2347/6710 train_time:522781ms step_avg:222.74ms step:2348/6710 train_time:523008ms step_avg:222.75ms step:2349/6710 train_time:523235ms step_avg:222.75ms step:2350/6710 train_time:523460ms step_avg:222.75ms step:2351/6710 train_time:523686ms step_avg:222.75ms step:2352/6710 train_time:523913ms step_avg:222.75ms step:2353/6710 train_time:524139ms step_avg:222.75ms step:2354/6710 train_time:524366ms step_avg:222.76ms step:2355/6710 train_time:524593ms step_avg:222.76ms step:2356/6710 train_time:524819ms step_avg:222.76ms step:2357/6710 train_time:525045ms step_avg:222.76ms step:2358/6710 train_time:525272ms step_avg:222.76ms step:2359/6710 train_time:525500ms step_avg:222.76ms step:2360/6710 train_time:525726ms step_avg:222.77ms step:2361/6710 train_time:525953ms step_avg:222.77ms step:2362/6710 train_time:526179ms step_avg:222.77ms step:2363/6710 train_time:526406ms step_avg:222.77ms step:2364/6710 train_time:526634ms step_avg:222.77ms step:2365/6710 train_time:526859ms step_avg:222.77ms step:2366/6710 train_time:527087ms step_avg:222.78ms step:2367/6710 train_time:527315ms step_avg:222.78ms step:2368/6710 train_time:527539ms step_avg:222.78ms step:2369/6710 train_time:527766ms step_avg:222.78ms step:2370/6710 train_time:527994ms step_avg:222.78ms step:2371/6710 train_time:528220ms step_avg:222.78ms step:2372/6710 train_time:528446ms step_avg:222.79ms step:2373/6710 train_time:528674ms step_avg:222.79ms step:2374/6710 train_time:528900ms step_avg:222.79ms step:2375/6710 train_time:529128ms step_avg:222.79ms step:2375/6710 val_loss:3.223378 train_time:529307ms step_avg:222.87ms Parameter containing: tensor([1.0000, 1.0000, 0.4093, 1.0000, 0.6613, 1.0000, 0.5592, 1.0000], device='cuda:0', requires_grad=True) 0 [6.154876232147217, 5.154874324798584] 1 [0.5831645727157593, 5.11405086517334] 2 [0.8511971831321716, 4.041112899780273] 3 [0.6719501614570618, 3.202329397201538] 4 [0.31460678577423096, 
2.2747716903686523] 5 [0.806015133857727, 3.5819244384765625] 6 [0.5199621319770813, 3.021547317504883] 7 [0.8288049697875977, 5.025668144226074] 8 [0.41118526458740234, 1.7803525924682617] 9 [0.5074359178543091, 2.605292797088623] 10 [0.6585848927497864, 2.88925838470459] 11 [0.4354667365550995, 2.9032158851623535] 12 [1.0378068685531616, 5.167573928833008] 13 [1.0962258577346802, 3.233675479888916] 14 [0.9819548726081848, 2.1429874897003174] 15 [0.7912741899490356, 1.6461806297302246] 0 [11.29409408569336, 23.839569091796875, 25.066184997558594] 1 [28.376684188842773, 24.33912467956543, 58.40599822998047] 2 [69.68989562988281, 21.55999183654785, 28.138629913330078] 3 [61.935543060302734, 26.349178314208984, 32.5780143737793] 4 [29.415267944335938, 24.021419525146484, 22.336589813232422] 5 [47.584434509277344, 22.926956176757812, 34.56752395629883] 6 [42.53472137451172, 25.709320068359375, 25.77074432373047] 7 [61.14044189453125, 0.0, 44.41905975341797] 8 [36.766700744628906, 28.13330078125, 41.78486251831055] 9 [58.34027862548828, 24.15105628967285, 33.58639144897461] 10 [78.90515899658203, 21.91446304321289, 30.72003936767578] 11 [58.26751708984375, 29.124631881713867, 16.945009231567383] 12 [90.89730834960938, 20.94156265258789, 20.576190948486328] 13 [123.30358123779297, 20.168087005615234, 27.747358322143555] 14 [137.18292236328125, 24.401538848876953, 40.60023498535156] 15 [125.56336975097656, 77.0707015991211, 115.94127655029297] step:2376/6710 train_time:529355ms step_avg:222.79ms step:2377/6710 train_time:529579ms step_avg:222.79ms step:2378/6710 train_time:529809ms step_avg:222.80ms step:2379/6710 train_time:530035ms step_avg:222.80ms step:2380/6710 train_time:530261ms step_avg:222.80ms step:2381/6710 train_time:530489ms step_avg:222.80ms step:2382/6710 train_time:530718ms step_avg:222.80ms step:2383/6710 train_time:530946ms step_avg:222.81ms step:2384/6710 train_time:531172ms step_avg:222.81ms step:2385/6710 train_time:531400ms step_avg:222.81ms 
step:2386/6710 train_time:531627ms step_avg:222.81ms step:2387/6710 train_time:531855ms step_avg:222.81ms step:2388/6710 train_time:532079ms step_avg:222.81ms step:2389/6710 train_time:532305ms step_avg:222.81ms step:2390/6710 train_time:532534ms step_avg:222.82ms step:2391/6710 train_time:532762ms step_avg:222.82ms step:2392/6710 train_time:532989ms step_avg:222.82ms step:2393/6710 train_time:533215ms step_avg:222.82ms step:2394/6710 train_time:533444ms step_avg:222.83ms step:2395/6710 train_time:533671ms step_avg:222.83ms step:2396/6710 train_time:533898ms step_avg:222.83ms step:2397/6710 train_time:534125ms step_avg:222.83ms step:2398/6710 train_time:534351ms step_avg:222.83ms step:2399/6710 train_time:534577ms step_avg:222.83ms step:2400/6710 train_time:534805ms step_avg:222.84ms step:2401/6710 train_time:535033ms step_avg:222.84ms step:2402/6710 train_time:535259ms step_avg:222.84ms step:2403/6710 train_time:535487ms step_avg:222.84ms step:2404/6710 train_time:535715ms step_avg:222.84ms step:2405/6710 train_time:535942ms step_avg:222.84ms step:2406/6710 train_time:536168ms step_avg:222.85ms step:2407/6710 train_time:536393ms step_avg:222.85ms step:2408/6710 train_time:536620ms step_avg:222.85ms step:2409/6710 train_time:536847ms step_avg:222.85ms step:2410/6710 train_time:537074ms step_avg:222.85ms step:2411/6710 train_time:537300ms step_avg:222.85ms step:2412/6710 train_time:537525ms step_avg:222.85ms step:2413/6710 train_time:537754ms step_avg:222.86ms step:2414/6710 train_time:537981ms step_avg:222.86ms step:2415/6710 train_time:538208ms step_avg:222.86ms step:2416/6710 train_time:538435ms step_avg:222.86ms step:2417/6710 train_time:538663ms step_avg:222.86ms step:2418/6710 train_time:538890ms step_avg:222.87ms step:2419/6710 train_time:539118ms step_avg:222.87ms step:2420/6710 train_time:539344ms step_avg:222.87ms step:2421/6710 train_time:539571ms step_avg:222.87ms step:2422/6710 train_time:539798ms step_avg:222.87ms step:2423/6710 train_time:540025ms 
step_avg:222.87ms step:2424/6710 train_time:540250ms step_avg:222.88ms step:2425/6710 train_time:540478ms step_avg:222.88ms step:2426/6710 train_time:540705ms step_avg:222.88ms step:2427/6710 train_time:540931ms step_avg:222.88ms step:2428/6710 train_time:541158ms step_avg:222.88ms step:2429/6710 train_time:541384ms step_avg:222.88ms step:2430/6710 train_time:541612ms step_avg:222.89ms step:2431/6710 train_time:541841ms step_avg:222.89ms step:2432/6710 train_time:542066ms step_avg:222.89ms step:2433/6710 train_time:542293ms step_avg:222.89ms step:2434/6710 train_time:542520ms step_avg:222.89ms step:2435/6710 train_time:542747ms step_avg:222.89ms step:2436/6710 train_time:542974ms step_avg:222.90ms step:2437/6710 train_time:543201ms step_avg:222.90ms step:2438/6710 train_time:543428ms step_avg:222.90ms step:2439/6710 train_time:543653ms step_avg:222.90ms step:2440/6710 train_time:543880ms step_avg:222.90ms step:2441/6710 train_time:544108ms step_avg:222.90ms step:2442/6710 train_time:544336ms step_avg:222.91ms step:2443/6710 train_time:544563ms step_avg:222.91ms step:2444/6710 train_time:544790ms step_avg:222.91ms step:2445/6710 train_time:545018ms step_avg:222.91ms step:2446/6710 train_time:545245ms step_avg:222.91ms step:2447/6710 train_time:545470ms step_avg:222.91ms step:2448/6710 train_time:545699ms step_avg:222.92ms step:2449/6710 train_time:545925ms step_avg:222.92ms step:2450/6710 train_time:546151ms step_avg:222.92ms step:2451/6710 train_time:546379ms step_avg:222.92ms step:2452/6710 train_time:546606ms step_avg:222.92ms step:2453/6710 train_time:546832ms step_avg:222.92ms step:2454/6710 train_time:547059ms step_avg:222.93ms step:2455/6710 train_time:547284ms step_avg:222.93ms step:2456/6710 train_time:547511ms step_avg:222.93ms step:2457/6710 train_time:547739ms step_avg:222.93ms step:2458/6710 train_time:547964ms step_avg:222.93ms step:2459/6710 train_time:548191ms step_avg:222.93ms step:2460/6710 train_time:548417ms step_avg:222.93ms step:2461/6710 
train_time:548645ms step_avg:222.94ms step:2462/6710 train_time:548872ms step_avg:222.94ms step:2463/6710 train_time:549100ms step_avg:222.94ms step:2464/6710 train_time:549325ms step_avg:222.94ms step:2465/6710 train_time:549551ms step_avg:222.94ms step:2466/6710 train_time:549778ms step_avg:222.94ms step:2467/6710 train_time:550005ms step_avg:222.94ms step:2468/6710 train_time:550232ms step_avg:222.95ms step:2469/6710 train_time:550459ms step_avg:222.95ms step:2470/6710 train_time:550684ms step_avg:222.95ms step:2471/6710 train_time:550911ms step_avg:222.95ms step:2472/6710 train_time:551138ms step_avg:222.95ms step:2473/6710 train_time:551363ms step_avg:222.95ms step:2474/6710 train_time:551591ms step_avg:222.96ms step:2475/6710 train_time:551818ms step_avg:222.96ms step:2476/6710 train_time:552045ms step_avg:222.96ms step:2477/6710 train_time:552272ms step_avg:222.96ms step:2478/6710 train_time:552500ms step_avg:222.96ms step:2479/6710 train_time:552726ms step_avg:222.96ms step:2480/6710 train_time:552951ms step_avg:222.96ms step:2481/6710 train_time:553179ms step_avg:222.97ms step:2482/6710 train_time:553405ms step_avg:222.97ms step:2483/6710 train_time:553630ms step_avg:222.97ms step:2484/6710 train_time:553856ms step_avg:222.97ms step:2485/6710 train_time:554084ms step_avg:222.97ms step:2486/6710 train_time:554311ms step_avg:222.97ms step:2487/6710 train_time:554540ms step_avg:222.98ms step:2488/6710 train_time:554770ms step_avg:222.98ms step:2489/6710 train_time:555002ms step_avg:222.98ms step:2490/6710 train_time:555232ms step_avg:222.98ms step:2491/6710 train_time:555463ms step_avg:222.99ms step:2492/6710 train_time:555693ms step_avg:222.99ms step:2493/6710 train_time:555924ms step_avg:222.99ms step:2494/6710 train_time:556153ms step_avg:223.00ms step:2495/6710 train_time:556385ms step_avg:223.00ms step:2496/6710 train_time:556617ms step_avg:223.00ms step:2497/6710 train_time:556846ms step_avg:223.01ms step:2498/6710 train_time:557077ms step_avg:223.01ms 
step:2499/6710 train_time:557308ms step_avg:223.01ms step:2500/6710 train_time:557539ms step_avg:223.02ms step:2500/6710 val_loss:3.208945 train_time:557719ms step_avg:223.09ms Parameter containing: tensor([1.0000, 1.0000, 0.4178, 1.0000, 0.6428, 1.0000, 0.5365, 1.0000], device='cuda:0', requires_grad=True) 0 [6.3165998458862305, 5.316597938537598] 1 [0.5714928507804871, 5.280152320861816] 2 [0.8515905141830444, 4.146324634552002] 3 [0.6830865144729614, 3.331984043121338] 4 [0.32219019532203674, 2.357659339904785] 5 [0.7985422015190125, 3.6627309322357178] 6 [0.5173084735870361, 3.0333871841430664] 7 [0.8427752256393433, 5.1089253425598145] 8 [0.4195294976234436, 1.7588121891021729] 9 [0.509998083114624, 2.5856516361236572] 10 [0.6664231419563293, 2.8959994316101074] 11 [0.4404817819595337, 2.9132418632507324] 12 [1.0197548866271973, 5.301540374755859] 13 [1.0933681726455688, 3.2925515174865723] 14 [0.9799889326095581, 2.138740062713623] 15 [0.7947787046432495, 1.623855471611023] 0 [11.622275352478027, 24.283714294433594, 26.254894256591797] 1 [28.787778854370117, 24.992393493652344, 61.19075012207031] 2 [72.12246704101562, 21.807750701904297, 28.551584243774414] 3 [64.67705535888672, 27.118846893310547, 32.79475021362305] 4 [31.032331466674805, 25.024070739746094, 22.913068771362305] 5 [49.111961364746094, 23.61131477355957, 35.363433837890625] 6 [43.443748474121094, 26.47907829284668, 26.00617790222168] 7 [63.354454040527344, 0.0, 45.01793670654297] 8 [38.51601791381836, 28.83244514465332, 42.84025955200195] 9 [59.63932800292969, 24.851478576660156, 33.584800720214844] 10 [80.996337890625, 22.694480895996094, 31.214000701904297] 11 [60.6107177734375, 30.232412338256836, 17.32475471496582] 12 [92.7470474243164, 21.82701301574707, 20.842599868774414] 13 [125.6949691772461, 20.74209976196289, 27.671043395996094] 14 [139.2919464111328, 25.275081634521484, 40.37189483642578] 15 [127.91181182861328, 80.01412200927734, 119.86251831054688] step:2501/6710 
train_time:557769ms step_avg:223.02ms step:2502/6710 train_time:557995ms step_avg:223.02ms step:2503/6710 train_time:558229ms step_avg:223.02ms step:2504/6710 train_time:558459ms step_avg:223.03ms step:2505/6710 train_time:558689ms step_avg:223.03ms step:2506/6710 train_time:558922ms step_avg:223.03ms step:2507/6710 train_time:559154ms step_avg:223.04ms step:2508/6710 train_time:559384ms step_avg:223.04ms step:2509/6710 train_time:559615ms step_avg:223.04ms step:2510/6710 train_time:559846ms step_avg:223.05ms step:2511/6710 train_time:560078ms step_avg:223.05ms step:2512/6710 train_time:560307ms step_avg:223.05ms step:2513/6710 train_time:560536ms step_avg:223.05ms step:2514/6710 train_time:560767ms step_avg:223.06ms step:2515/6710 train_time:561000ms step_avg:223.06ms step:2516/6710 train_time:561231ms step_avg:223.06ms step:2517/6710 train_time:561463ms step_avg:223.07ms step:2518/6710 train_time:561694ms step_avg:223.07ms step:2519/6710 train_time:561924ms step_avg:223.07ms step:2520/6710 train_time:562157ms step_avg:223.08ms step:2521/6710 train_time:562387ms step_avg:223.08ms step:2522/6710 train_time:562618ms step_avg:223.08ms step:2523/6710 train_time:562849ms step_avg:223.09ms step:2524/6710 train_time:563081ms step_avg:223.09ms step:2525/6710 train_time:563314ms step_avg:223.09ms step:2526/6710 train_time:563545ms step_avg:223.10ms step:2527/6710 train_time:563776ms step_avg:223.10ms step:2528/6710 train_time:564005ms step_avg:223.10ms step:2529/6710 train_time:564236ms step_avg:223.11ms step:2530/6710 train_time:564467ms step_avg:223.11ms step:2531/6710 train_time:564699ms step_avg:223.11ms step:2532/6710 train_time:564928ms step_avg:223.12ms step:2533/6710 train_time:565159ms step_avg:223.12ms step:2534/6710 train_time:565390ms step_avg:223.12ms step:2535/6710 train_time:565620ms step_avg:223.12ms step:2536/6710 train_time:565850ms step_avg:223.13ms step:2537/6710 train_time:566081ms step_avg:223.13ms step:2538/6710 train_time:566312ms step_avg:223.13ms 
step:2539/6710 train_time:566544ms step_avg:223.14ms step:2540/6710 train_time:566775ms step_avg:223.14ms step:2541/6710 train_time:567007ms step_avg:223.14ms step:2542/6710 train_time:567239ms step_avg:223.15ms step:2543/6710 train_time:567471ms step_avg:223.15ms step:2544/6710 train_time:567701ms step_avg:223.15ms step:2545/6710 train_time:567930ms step_avg:223.16ms step:2546/6710 train_time:568162ms step_avg:223.16ms step:2547/6710 train_time:568394ms step_avg:223.16ms step:2548/6710 train_time:568623ms step_avg:223.16ms step:2549/6710 train_time:568854ms step_avg:223.17ms step:2550/6710 train_time:569084ms step_avg:223.17ms step:2551/6710 train_time:569315ms step_avg:223.17ms step:2552/6710 train_time:569546ms step_avg:223.18ms step:2553/6710 train_time:569777ms step_avg:223.18ms step:2554/6710 train_time:570006ms step_avg:223.18ms step:2555/6710 train_time:570237ms step_avg:223.18ms step:2556/6710 train_time:570469ms step_avg:223.19ms step:2557/6710 train_time:570700ms step_avg:223.19ms step:2558/6710 train_time:570931ms step_avg:223.19ms step:2559/6710 train_time:571162ms step_avg:223.20ms step:2560/6710 train_time:571394ms step_avg:223.20ms step:2561/6710 train_time:571624ms step_avg:223.20ms step:2562/6710 train_time:571856ms step_avg:223.21ms step:2563/6710 train_time:572087ms step_avg:223.21ms step:2564/6710 train_time:572318ms step_avg:223.21ms step:2565/6710 train_time:572548ms step_avg:223.22ms step:2566/6710 train_time:572780ms step_avg:223.22ms step:2567/6710 train_time:573011ms step_avg:223.22ms step:2568/6710 train_time:573243ms step_avg:223.23ms step:2569/6710 train_time:573475ms step_avg:223.23ms step:2570/6710 train_time:573706ms step_avg:223.23ms step:2571/6710 train_time:573938ms step_avg:223.24ms step:2572/6710 train_time:574169ms step_avg:223.24ms step:2573/6710 train_time:574400ms step_avg:223.24ms step:2574/6710 train_time:574632ms step_avg:223.24ms step:2575/6710 train_time:574861ms step_avg:223.25ms step:2576/6710 train_time:575094ms 
step_avg:223.25ms step:2577/6710 train_time:575324ms step_avg:223.25ms step:2578/6710 train_time:575556ms step_avg:223.26ms step:2579/6710 train_time:575785ms step_avg:223.26ms step:2580/6710 train_time:576016ms step_avg:223.26ms step:2581/6710 train_time:576246ms step_avg:223.26ms step:2582/6710 train_time:576478ms step_avg:223.27ms step:2583/6710 train_time:576708ms step_avg:223.27ms step:2584/6710 train_time:576940ms step_avg:223.27ms step:2585/6710 train_time:577170ms step_avg:223.28ms step:2586/6710 train_time:577401ms step_avg:223.28ms step:2587/6710 train_time:577633ms step_avg:223.28ms step:2588/6710 train_time:577862ms step_avg:223.29ms step:2589/6710 train_time:578094ms step_avg:223.29ms step:2590/6710 train_time:578325ms step_avg:223.29ms step:2591/6710 train_time:578559ms step_avg:223.30ms step:2592/6710 train_time:578788ms step_avg:223.30ms step:2593/6710 train_time:579019ms step_avg:223.30ms step:2594/6710 train_time:579249ms step_avg:223.30ms step:2595/6710 train_time:579482ms step_avg:223.31ms step:2596/6710 train_time:579713ms step_avg:223.31ms step:2597/6710 train_time:579944ms step_avg:223.31ms step:2598/6710 train_time:580176ms step_avg:223.32ms step:2599/6710 train_time:580407ms step_avg:223.32ms step:2600/6710 train_time:580639ms step_avg:223.32ms step:2601/6710 train_time:580871ms step_avg:223.33ms step:2602/6710 train_time:581102ms step_avg:223.33ms step:2603/6710 train_time:581333ms step_avg:223.33ms step:2604/6710 train_time:581563ms step_avg:223.33ms step:2605/6710 train_time:581795ms step_avg:223.34ms step:2606/6710 train_time:582024ms step_avg:223.34ms step:2607/6710 train_time:582256ms step_avg:223.34ms step:2608/6710 train_time:582485ms step_avg:223.35ms step:2609/6710 train_time:582717ms step_avg:223.35ms step:2610/6710 train_time:582948ms step_avg:223.35ms step:2611/6710 train_time:583179ms step_avg:223.35ms step:2612/6710 train_time:583408ms step_avg:223.36ms step:2613/6710 train_time:583639ms step_avg:223.36ms step:2614/6710 
train_time:583872ms step_avg:223.36ms step:2615/6710 train_time:584103ms step_avg:223.37ms step:2616/6710 train_time:584334ms step_avg:223.37ms step:2617/6710 train_time:584563ms step_avg:223.37ms step:2618/6710 train_time:584794ms step_avg:223.37ms step:2619/6710 train_time:585026ms step_avg:223.38ms step:2620/6710 train_time:585258ms step_avg:223.38ms step:2621/6710 train_time:585486ms step_avg:223.38ms step:2622/6710 train_time:585718ms step_avg:223.39ms step:2623/6710 train_time:585949ms step_avg:223.39ms step:2624/6710 train_time:586180ms step_avg:223.39ms step:2625/6710 train_time:586413ms step_avg:223.40ms step:2625/6710 val_loss:3.199776 train_time:586594ms step_avg:223.46ms Parameter containing: tensor([1.0000, 1.0000, 0.4110, 1.0000, 0.6363, 1.0000, 0.5440, 1.0000], device='cuda:0', requires_grad=True) 0 [6.5014238357543945, 5.501421928405762] 1 [0.5618438124656677, 5.4843058586120605] 2 [0.8438237905502319, 4.259422302246094] 3 [0.6779186129570007, 3.4395103454589844] 4 [0.32495835423469543, 2.4442567825317383] 5 [0.7826259136199951, 3.757211208343506] 6 [0.507611095905304, 3.0865628719329834] 7 [0.8284491896629333, 5.294367790222168] 8 [0.41561195254325867, 1.7853089570999146] 9 [0.4957413673400879, 2.64128041267395] 10 [0.6608564853668213, 2.9441840648651123] 11 [0.43820759654045105, 2.986499309539795] 12 [1.0032613277435303, 5.481849670410156] 13 [1.0943788290023804, 3.367177724838257] 14 [0.9833181500434875, 2.13335919380188] 15 [0.7958052158355713, 1.5712023973464966] 0 [11.990609169006348, 24.88360595703125, 27.165040969848633] 1 [29.229177474975586, 25.840988159179688, 63.188106536865234] 2 [73.44281005859375, 22.55748748779297, 29.48409652709961] 3 [65.60260772705078, 28.203826904296875, 34.28758239746094] 4 [32.06129455566406, 25.63201141357422, 24.224842071533203] 5 [49.81536102294922, 24.451141357421875, 36.48729705810547] 6 [43.60538864135742, 27.537330627441406, 26.55550193786621] 7 [63.25858688354492, 0.0, 46.160728454589844] 8 
[38.49250793457031, 29.851852416992188, 43.8000602722168] 9 [58.97886657714844, 25.516494750976562, 34.399898529052734] 10 [80.8646011352539, 23.91033935546875, 32.53035354614258] 11 [60.92881393432617, 31.215801239013672, 18.09241485595703] 12 [92.81011199951172, 22.893129348754883, 21.402996063232422] 13 [127.00323486328125, 21.32598876953125, 28.582677841186523] 14 [141.7535400390625, 25.90373420715332, 41.885467529296875] 15 [131.0399627685547, 83.11321258544922, 128.06898498535156] step:2626/6710 train_time:586644ms step_avg:223.40ms step:2627/6710 train_time:586872ms step_avg:223.40ms step:2628/6710 train_time:587108ms step_avg:223.41ms step:2629/6710 train_time:587336ms step_avg:223.41ms step:2630/6710 train_time:587567ms step_avg:223.41ms step:2631/6710 train_time:587799ms step_avg:223.41ms step:2632/6710 train_time:588031ms step_avg:223.42ms step:2633/6710 train_time:588261ms step_avg:223.42ms step:2634/6710 train_time:588491ms step_avg:223.42ms step:2635/6710 train_time:588723ms step_avg:223.42ms step:2636/6710 train_time:588952ms step_avg:223.43ms step:2637/6710 train_time:589184ms step_avg:223.43ms step:2638/6710 train_time:589414ms step_avg:223.43ms step:2639/6710 train_time:589644ms step_avg:223.43ms step:2640/6710 train_time:589874ms step_avg:223.44ms step:2641/6710 train_time:590105ms step_avg:223.44ms step:2642/6710 train_time:590336ms step_avg:223.44ms step:2643/6710 train_time:590565ms step_avg:223.45ms step:2644/6710 train_time:590796ms step_avg:223.45ms step:2645/6710 train_time:591029ms step_avg:223.45ms step:2646/6710 train_time:591260ms step_avg:223.45ms step:2647/6710 train_time:591490ms step_avg:223.46ms step:2648/6710 train_time:591722ms step_avg:223.46ms step:2649/6710 train_time:591951ms step_avg:223.46ms step:2650/6710 train_time:592182ms step_avg:223.46ms step:2651/6710 train_time:592411ms step_avg:223.47ms step:2652/6710 train_time:592642ms step_avg:223.47ms step:2653/6710 train_time:592873ms step_avg:223.47ms step:2654/6710 
train_time:593103ms step_avg:223.48ms step:2655/6710 train_time:593334ms step_avg:223.48ms step:2656/6710 train_time:593565ms step_avg:223.48ms step:2657/6710 train_time:593796ms step_avg:223.48ms step:2658/6710 train_time:594026ms step_avg:223.49ms step:2659/6710 train_time:594257ms step_avg:223.49ms step:2660/6710 train_time:594488ms step_avg:223.49ms step:2661/6710 train_time:594719ms step_avg:223.49ms step:2662/6710 train_time:594950ms step_avg:223.50ms step:2663/6710 train_time:595441ms step_avg:223.60ms step:2664/6710 train_time:595668ms step_avg:223.60ms step:2665/6710 train_time:595896ms step_avg:223.60ms step:2666/6710 train_time:596123ms step_avg:223.60ms step:2667/6710 train_time:596358ms step_avg:223.61ms step:2668/6710 train_time:596592ms step_avg:223.61ms step:2669/6710 train_time:596823ms step_avg:223.61ms step:2670/6710 train_time:597050ms step_avg:223.61ms step:2671/6710 train_time:597280ms step_avg:223.62ms step:2672/6710 train_time:597513ms step_avg:223.62ms step:2673/6710 train_time:597745ms step_avg:223.62ms step:2674/6710 train_time:597975ms step_avg:223.63ms step:2675/6710 train_time:598205ms step_avg:223.63ms step:2676/6710 train_time:598438ms step_avg:223.63ms step:2677/6710 train_time:598668ms step_avg:223.63ms step:2678/6710 train_time:598897ms step_avg:223.64ms step:2679/6710 train_time:599130ms step_avg:223.64ms step:2680/6710 train_time:599363ms step_avg:223.64ms step:2681/6710 train_time:599594ms step_avg:223.65ms step:2682/6710 train_time:599825ms step_avg:223.65ms step:2683/6710 train_time:600056ms step_avg:223.65ms step:2684/6710 train_time:600285ms step_avg:223.65ms step:2685/6710 train_time:600516ms step_avg:223.66ms step:2686/6710 train_time:600747ms step_avg:223.66ms step:2687/6710 train_time:600978ms step_avg:223.66ms step:2688/6710 train_time:601207ms step_avg:223.66ms step:2689/6710 train_time:601437ms step_avg:223.67ms step:2690/6710 train_time:601668ms step_avg:223.67ms step:2691/6710 train_time:601897ms step_avg:223.67ms 
step:2692/6710 train_time:602129ms step_avg:223.67ms step:2693/6710 train_time:602360ms step_avg:223.68ms step:2694/6710 train_time:602589ms step_avg:223.68ms step:2695/6710 train_time:602821ms step_avg:223.68ms step:2696/6710 train_time:603053ms step_avg:223.68ms step:2697/6710 train_time:603284ms step_avg:223.69ms step:2698/6710 train_time:603514ms step_avg:223.69ms step:2699/6710 train_time:603744ms step_avg:223.69ms step:2700/6710 train_time:603976ms step_avg:223.69ms step:2701/6710 train_time:604206ms step_avg:223.70ms step:2702/6710 train_time:604437ms step_avg:223.70ms step:2703/6710 train_time:604667ms step_avg:223.70ms step:2704/6710 train_time:604899ms step_avg:223.71ms step:2705/6710 train_time:605130ms step_avg:223.71ms step:2706/6710 train_time:605360ms step_avg:223.71ms step:2707/6710 train_time:605591ms step_avg:223.71ms step:2708/6710 train_time:605822ms step_avg:223.72ms step:2709/6710 train_time:606053ms step_avg:223.72ms step:2710/6710 train_time:606285ms step_avg:223.72ms step:2711/6710 train_time:606515ms step_avg:223.72ms step:2712/6710 train_time:606746ms step_avg:223.73ms step:2713/6710 train_time:606977ms step_avg:223.73ms step:2714/6710 train_time:607210ms step_avg:223.73ms step:2715/6710 train_time:607441ms step_avg:223.74ms step:2716/6710 train_time:607671ms step_avg:223.74ms step:2717/6710 train_time:607904ms step_avg:223.74ms step:2718/6710 train_time:608134ms step_avg:223.74ms step:2719/6710 train_time:608365ms step_avg:223.75ms step:2720/6710 train_time:608594ms step_avg:223.75ms step:2721/6710 train_time:608825ms step_avg:223.75ms step:2722/6710 train_time:609057ms step_avg:223.75ms step:2723/6710 train_time:609287ms step_avg:223.76ms step:2724/6710 train_time:609519ms step_avg:223.76ms step:2725/6710 train_time:609749ms step_avg:223.76ms step:2726/6710 train_time:609979ms step_avg:223.76ms step:2727/6710 train_time:610211ms step_avg:223.77ms step:2728/6710 train_time:610440ms step_avg:223.77ms step:2729/6710 train_time:610672ms 
step_avg:223.77ms step:2730/6710 train_time:610905ms step_avg:223.77ms step:2731/6710 train_time:611132ms step_avg:223.78ms step:2732/6710 train_time:611364ms step_avg:223.78ms step:2733/6710 train_time:611593ms step_avg:223.78ms step:2734/6710 train_time:611826ms step_avg:223.78ms step:2735/6710 train_time:612056ms step_avg:223.79ms step:2736/6710 train_time:612286ms step_avg:223.79ms step:2737/6710 train_time:612517ms step_avg:223.79ms step:2738/6710 train_time:612748ms step_avg:223.79ms step:2739/6710 train_time:612980ms step_avg:223.80ms step:2740/6710 train_time:613210ms step_avg:223.80ms step:2741/6710 train_time:613440ms step_avg:223.80ms step:2742/6710 train_time:613668ms step_avg:223.80ms step:2743/6710 train_time:613899ms step_avg:223.81ms step:2744/6710 train_time:614131ms step_avg:223.81ms step:2745/6710 train_time:614361ms step_avg:223.81ms step:2746/6710 train_time:614589ms step_avg:223.81ms step:2747/6710 train_time:614820ms step_avg:223.82ms step:2748/6710 train_time:615050ms step_avg:223.82ms step:2749/6710 train_time:615281ms step_avg:223.82ms step:2750/6710 train_time:615512ms step_avg:223.82ms step:2750/6710 val_loss:3.191684 train_time:615694ms step_avg:223.89ms Parameter containing: tensor([1.0000, 1.0000, 0.4157, 1.0000, 0.6279, 1.0000, 0.5462, 1.0000], device='cuda:0', requires_grad=True) 0 [6.670017719268799, 5.670015811920166] 1 [0.5566691160202026, 5.662166595458984] 2 [0.8389444351196289, 4.399772644042969] 3 [0.6860861778259277, 3.5564279556274414] 4 [0.327474445104599, 2.543102502822876] 5 [0.7730721235275269, 3.8541951179504395] 6 [0.5027992725372314, 3.1432180404663086] 7 [0.8153812885284424, 5.451178550720215] 8 [0.4238044321537018, 1.793317198753357] 9 [0.4866434931755066, 2.6599178314208984] 10 [0.6657369136810303, 3.0076775550842285] 11 [0.43976065516471863, 3.075023889541626] 12 [0.9883727431297302, 5.66616678237915] 13 [1.0833818912506104, 3.4699902534484863] 14 [0.9803891777992249, 2.156489849090576] 15 [0.8038855195045471, 
1.549780249595642] 0 [12.328841209411621, 25.69003677368164, 28.18328857421875] 1 [29.824373245239258, 26.63043212890625, 65.8513412475586] 2 [75.70655822753906, 23.216283798217773, 30.004125595092773] 3 [68.1041030883789, 28.894134521484375, 35.448646545410156] 4 [33.339176177978516, 26.269968032836914, 25.102954864501953] 5 [50.72652816772461, 25.273984909057617, 37.71523666381836] 6 [44.259864807128906, 28.375288009643555, 27.620494842529297] 7 [63.765846252441406, 0.0, 46.99123764038086] 8 [39.64952850341797, 30.62839126586914, 45.63544464111328] 9 [59.62337112426758, 26.320947647094727, 35.66709899902344] 10 [82.70233154296875, 24.74732208251953, 33.88386535644531] 11 [62.7632942199707, 31.915830612182617, 19.130748748779297] 12 [94.1493911743164, 23.53624725341797, 22.27894401550293] 13 [128.01280212402344, 22.136890411376953, 29.621585845947266] 14 [142.9390869140625, 26.83336639404297, 43.0728874206543] 15 [134.08615112304688, 85.25421142578125, 134.4750518798828] step:2751/6710 train_time:615744ms step_avg:223.83ms step:2752/6710 train_time:615970ms step_avg:223.83ms step:2753/6710 train_time:616207ms step_avg:223.83ms step:2754/6710 train_time:616437ms step_avg:223.83ms step:2755/6710 train_time:616668ms step_avg:223.84ms step:2756/6710 train_time:616901ms step_avg:223.84ms step:2757/6710 train_time:617133ms step_avg:223.84ms step:2758/6710 train_time:617363ms step_avg:223.84ms step:2759/6710 train_time:617593ms step_avg:223.85ms step:2760/6710 train_time:617822ms step_avg:223.85ms step:2761/6710 train_time:618054ms step_avg:223.85ms step:2762/6710 train_time:618285ms step_avg:223.85ms step:2763/6710 train_time:618515ms step_avg:223.86ms step:2764/6710 train_time:618746ms step_avg:223.86ms step:2765/6710 train_time:618977ms step_avg:223.86ms step:2766/6710 train_time:619208ms step_avg:223.86ms step:2767/6710 train_time:619439ms step_avg:223.87ms step:2768/6710 train_time:619668ms step_avg:223.87ms step:2769/6710 train_time:619900ms step_avg:223.87ms 
step:2770/6710 train_time:620132ms step_avg:223.87ms step:2771/6710 train_time:620361ms step_avg:223.88ms step:2772/6710 train_time:620591ms step_avg:223.88ms step:2773/6710 train_time:620820ms step_avg:223.88ms step:2774/6710 train_time:621051ms step_avg:223.88ms step:2775/6710 train_time:621282ms step_avg:223.89ms step:2776/6710 train_time:621514ms step_avg:223.89ms step:2777/6710 train_time:621744ms step_avg:223.89ms step:2778/6710 train_time:621974ms step_avg:223.89ms step:2779/6710 train_time:622205ms step_avg:223.90ms step:2780/6710 train_time:622435ms step_avg:223.90ms step:2781/6710 train_time:622667ms step_avg:223.90ms step:2782/6710 train_time:622896ms step_avg:223.90ms step:2783/6710 train_time:623129ms step_avg:223.91ms step:2784/6710 train_time:623360ms step_avg:223.91ms step:2785/6710 train_time:623591ms step_avg:223.91ms step:2786/6710 train_time:623821ms step_avg:223.91ms step:2787/6710 train_time:624051ms step_avg:223.91ms step:2788/6710 train_time:624280ms step_avg:223.92ms step:2789/6710 train_time:624512ms step_avg:223.92ms step:2790/6710 train_time:624742ms step_avg:223.92ms step:2791/6710 train_time:624974ms step_avg:223.92ms step:2792/6710 train_time:625204ms step_avg:223.93ms step:2793/6710 train_time:625435ms step_avg:223.93ms step:2794/6710 train_time:625665ms step_avg:223.93ms step:2795/6710 train_time:625896ms step_avg:223.93ms step:2796/6710 train_time:626126ms step_avg:223.94ms step:2797/6710 train_time:626357ms step_avg:223.94ms step:2798/6710 train_time:626589ms step_avg:223.94ms step:2799/6710 train_time:626820ms step_avg:223.94ms step:2800/6710 train_time:627052ms step_avg:223.95ms step:2801/6710 train_time:627280ms step_avg:223.95ms step:2802/6710 train_time:627512ms step_avg:223.95ms step:2803/6710 train_time:627741ms step_avg:223.95ms step:2804/6710 train_time:627972ms step_avg:223.96ms step:2805/6710 train_time:628200ms step_avg:223.96ms step:2806/6710 train_time:628431ms step_avg:223.96ms step:2807/6710 train_time:628664ms 
step_avg:223.96ms step:2808/6710 train_time:628895ms step_avg:223.97ms step:2809/6710 train_time:629124ms step_avg:223.97ms step:2810/6710 train_time:629355ms step_avg:223.97ms step:2811/6710 train_time:629585ms step_avg:223.97ms step:2812/6710 train_time:629817ms step_avg:223.97ms step:2813/6710 train_time:630047ms step_avg:223.98ms step:2814/6710 train_time:630278ms step_avg:223.98ms step:2815/6710 train_time:630508ms step_avg:223.98ms step:2816/6710 train_time:630739ms step_avg:223.98ms step:2817/6710 train_time:630970ms step_avg:223.99ms step:2818/6710 train_time:631200ms step_avg:223.99ms step:2819/6710 train_time:631432ms step_avg:223.99ms step:2820/6710 train_time:631661ms step_avg:223.99ms step:2821/6710 train_time:631893ms step_avg:224.00ms step:2822/6710 train_time:632123ms step_avg:224.00ms step:2823/6710 train_time:632354ms step_avg:224.00ms step:2824/6710 train_time:632584ms step_avg:224.00ms step:2825/6710 train_time:632814ms step_avg:224.01ms step:2826/6710 train_time:633045ms step_avg:224.01ms step:2827/6710 train_time:633276ms step_avg:224.01ms step:2828/6710 train_time:633509ms step_avg:224.01ms step:2829/6710 train_time:633739ms step_avg:224.02ms step:2830/6710 train_time:633969ms step_avg:224.02ms step:2831/6710 train_time:634199ms step_avg:224.02ms step:2832/6710 train_time:634430ms step_avg:224.02ms step:2833/6710 train_time:634661ms step_avg:224.02ms step:2834/6710 train_time:634892ms step_avg:224.03ms step:2835/6710 train_time:635122ms step_avg:224.03ms step:2836/6710 train_time:635352ms step_avg:224.03ms step:2837/6710 train_time:635584ms step_avg:224.03ms step:2838/6710 train_time:635815ms step_avg:224.04ms step:2839/6710 train_time:636045ms step_avg:224.04ms step:2840/6710 train_time:636276ms step_avg:224.04ms step:2841/6710 train_time:636508ms step_avg:224.04ms step:2842/6710 train_time:636740ms step_avg:224.05ms step:2843/6710 train_time:636972ms step_avg:224.05ms step:2844/6710 train_time:637201ms step_avg:224.05ms step:2845/6710 
train_time:637434ms step_avg:224.05ms step:2846/6710 train_time:637666ms step_avg:224.06ms step:2847/6710 train_time:637897ms step_avg:224.06ms step:2848/6710 train_time:638128ms step_avg:224.06ms step:2849/6710 train_time:638356ms step_avg:224.06ms step:2850/6710 train_time:638588ms step_avg:224.07ms step:2851/6710 train_time:638819ms step_avg:224.07ms step:2852/6710 train_time:639049ms step_avg:224.07ms step:2853/6710 train_time:639278ms step_avg:224.07ms step:2854/6710 train_time:639508ms step_avg:224.07ms step:2855/6710 train_time:639741ms step_avg:224.08ms step:2856/6710 train_time:639972ms step_avg:224.08ms step:2857/6710 train_time:640201ms step_avg:224.08ms step:2858/6710 train_time:640432ms step_avg:224.08ms step:2859/6710 train_time:640665ms step_avg:224.09ms step:2860/6710 train_time:640895ms step_avg:224.09ms step:2861/6710 train_time:641125ms step_avg:224.09ms step:2862/6710 train_time:641357ms step_avg:224.09ms step:2863/6710 train_time:641587ms step_avg:224.10ms step:2864/6710 train_time:641818ms step_avg:224.10ms step:2865/6710 train_time:642049ms step_avg:224.10ms step:2866/6710 train_time:642280ms step_avg:224.10ms step:2867/6710 train_time:642512ms step_avg:224.11ms step:2868/6710 train_time:642742ms step_avg:224.11ms step:2869/6710 train_time:642974ms step_avg:224.11ms step:2870/6710 train_time:643205ms step_avg:224.11ms step:2871/6710 train_time:643437ms step_avg:224.12ms step:2872/6710 train_time:643667ms step_avg:224.12ms step:2873/6710 train_time:643898ms step_avg:224.12ms step:2874/6710 train_time:644130ms step_avg:224.12ms step:2875/6710 train_time:644362ms step_avg:224.13ms step:2875/6710 val_loss:3.180766 train_time:644544ms step_avg:224.19ms Parameter containing: tensor([1.0000, 1.0000, 0.4179, 1.0000, 0.6221, 1.0000, 0.5329, 1.0000], device='cuda:0', requires_grad=True) 0 [6.817691802978516, 5.817689895629883] 1 [0.5558956861495972, 5.81285285949707] 2 [0.8256567716598511, 4.4802751541137695] 3 [0.6820293068885803, 3.6418561935424805] 
4 [0.3276706337928772, 2.5996906757354736] 5 [0.7775141596794128, 3.922243118286133] 6 [0.5039522647857666, 3.172987937927246] 7 [0.8198412656784058, 5.545584678649902] 8 [0.4270963668823242, 1.7549015283584595] 9 [0.49195125699043274, 2.648024559020996] 10 [0.6609604358673096, 3.040310859680176] 11 [0.43339836597442627, 3.108356237411499] 12 [0.9869077801704407, 5.785398483276367] 13 [1.0893640518188477, 3.50777530670166] 14 [0.9797568917274475, 2.1190872192382812] 15 [0.8052391409873962, 1.484220266342163] 0 [12.625351905822754, 26.259063720703125, 28.680633544921875] 1 [30.37606430053711, 27.17892837524414, 67.64915466308594] 2 [76.25652313232422, 23.555145263671875, 30.613927841186523] 3 [68.35774230957031, 29.53705406188965, 36.2055778503418] 4 [33.709999084472656, 26.688798904418945, 26.10700035095215] 5 [51.89332962036133, 25.916542053222656, 38.305816650390625] 6 [45.19303512573242, 29.072153091430664, 27.70685386657715] 7 [65.00586700439453, 0.0, 47.56991195678711] 8 [40.61192321777344, 31.332334518432617, 46.40891647338867] 9 [60.852542877197266, 26.849332809448242, 35.95358657836914] 10 [83.26922607421875, 25.496143341064453, 34.33468246459961] 11 [62.58591842651367, 32.67646026611328, 19.125469207763672] 12 [94.38752746582031, 24.403343200683594, 22.143756866455078] 13 [129.42437744140625, 22.1199951171875, 29.569677352905273] 14 [144.2627410888672, 26.78122329711914, 42.798770904541016] 15 [135.19407653808594, 87.7392349243164, 138.3953857421875] step:2876/6710 train_time:644593ms step_avg:224.13ms step:2877/6710 train_time:644821ms step_avg:224.13ms step:2878/6710 train_time:645055ms step_avg:224.13ms step:2879/6710 train_time:645284ms step_avg:224.13ms step:2880/6710 train_time:645518ms step_avg:224.14ms step:2881/6710 train_time:645750ms step_avg:224.14ms step:2882/6710 train_time:645980ms step_avg:224.14ms step:2883/6710 train_time:646210ms step_avg:224.15ms step:2884/6710 train_time:646439ms step_avg:224.15ms step:2885/6710 train_time:646669ms 
step_avg:224.15ms step:2886/6710 train_time:646899ms step_avg:224.15ms step:2887/6710 train_time:647130ms step_avg:224.15ms step:2888/6710 train_time:647360ms step_avg:224.16ms step:2889/6710 train_time:647591ms step_avg:224.16ms step:2890/6710 train_time:647821ms step_avg:224.16ms step:2891/6710 train_time:648053ms step_avg:224.16ms step:2892/6710 train_time:648284ms step_avg:224.16ms step:2893/6710 train_time:648514ms step_avg:224.17ms step:2894/6710 train_time:648744ms step_avg:224.17ms step:2895/6710 train_time:648975ms step_avg:224.17ms step:2896/6710 train_time:649206ms step_avg:224.17ms step:2897/6710 train_time:649437ms step_avg:224.18ms step:2898/6710 train_time:649667ms step_avg:224.18ms step:2899/6710 train_time:649898ms step_avg:224.18ms step:2900/6710 train_time:650129ms step_avg:224.18ms step:2901/6710 train_time:650360ms step_avg:224.18ms step:2902/6710 train_time:650591ms step_avg:224.19ms step:2903/6710 train_time:650821ms step_avg:224.19ms step:2904/6710 train_time:651052ms step_avg:224.19ms step:2905/6710 train_time:651284ms step_avg:224.19ms step:2906/6710 train_time:651515ms step_avg:224.20ms step:2907/6710 train_time:651746ms step_avg:224.20ms step:2908/6710 train_time:651977ms step_avg:224.20ms step:2909/6710 train_time:652208ms step_avg:224.20ms step:2910/6710 train_time:652439ms step_avg:224.21ms step:2911/6710 train_time:652670ms step_avg:224.21ms step:2912/6710 train_time:652902ms step_avg:224.21ms step:2913/6710 train_time:653133ms step_avg:224.21ms step:2914/6710 train_time:653363ms step_avg:224.22ms step:2915/6710 train_time:653593ms step_avg:224.22ms step:2916/6710 train_time:653823ms step_avg:224.22ms step:2917/6710 train_time:654054ms step_avg:224.22ms step:2918/6710 train_time:654285ms step_avg:224.22ms step:2919/6710 train_time:654514ms step_avg:224.23ms step:2920/6710 train_time:654743ms step_avg:224.23ms step:2921/6710 train_time:654975ms step_avg:224.23ms step:2922/6710 train_time:655205ms step_avg:224.23ms step:2923/6710 
train_time:655435ms step_avg:224.23ms step:2924/6710 train_time:655664ms step_avg:224.24ms step:2925/6710 train_time:655895ms step_avg:224.24ms step:2926/6710 train_time:656126ms step_avg:224.24ms step:2927/6710 train_time:656357ms step_avg:224.24ms step:2928/6710 train_time:656586ms step_avg:224.24ms step:2929/6710 train_time:656817ms step_avg:224.25ms step:2930/6710 train_time:657048ms step_avg:224.25ms step:2931/6710 train_time:657280ms step_avg:224.25ms step:2932/6710 train_time:657510ms step_avg:224.25ms step:2933/6710 train_time:657740ms step_avg:224.26ms step:2934/6710 train_time:657972ms step_avg:224.26ms step:2935/6710 train_time:658202ms step_avg:224.26ms step:2936/6710 train_time:658433ms step_avg:224.26ms step:2937/6710 train_time:658662ms step_avg:224.26ms step:2938/6710 train_time:658892ms step_avg:224.27ms step:2939/6710 train_time:659120ms step_avg:224.27ms step:2940/6710 train_time:659351ms step_avg:224.27ms step:2941/6710 train_time:659580ms step_avg:224.27ms step:2942/6710 train_time:659811ms step_avg:224.27ms step:2943/6710 train_time:660041ms step_avg:224.27ms step:2944/6710 train_time:660272ms step_avg:224.28ms step:2945/6710 train_time:660503ms step_avg:224.28ms step:2946/6710 train_time:660734ms step_avg:224.28ms step:2947/6710 train_time:660963ms step_avg:224.28ms step:2948/6710 train_time:661194ms step_avg:224.29ms step:2949/6710 train_time:661424ms step_avg:224.29ms step:2950/6710 train_time:661655ms step_avg:224.29ms step:2951/6710 train_time:661886ms step_avg:224.29ms step:2952/6710 train_time:662117ms step_avg:224.29ms step:2953/6710 train_time:662346ms step_avg:224.30ms step:2954/6710 train_time:662575ms step_avg:224.30ms step:2955/6710 train_time:662806ms step_avg:224.30ms step:2956/6710 train_time:663037ms step_avg:224.30ms step:2957/6710 train_time:663267ms step_avg:224.30ms step:2958/6710 train_time:663498ms step_avg:224.31ms step:2959/6710 train_time:663729ms step_avg:224.31ms step:2960/6710 train_time:663961ms step_avg:224.31ms 
step:2961/6710 train_time:664191ms step_avg:224.31ms step:2962/6710 train_time:664421ms step_avg:224.31ms step:2963/6710 train_time:664649ms step_avg:224.32ms step:2964/6710 train_time:664880ms step_avg:224.32ms step:2965/6710 train_time:665112ms step_avg:224.32ms step:2966/6710 train_time:665341ms step_avg:224.32ms step:2967/6710 train_time:665572ms step_avg:224.32ms step:2968/6710 train_time:665802ms step_avg:224.33ms step:2969/6710 train_time:666033ms step_avg:224.33ms step:2970/6710 train_time:666264ms step_avg:224.33ms step:2971/6710 train_time:666496ms step_avg:224.33ms step:2972/6710 train_time:666728ms step_avg:224.34ms step:2973/6710 train_time:666959ms step_avg:224.34ms step:2974/6710 train_time:667190ms step_avg:224.34ms step:2975/6710 train_time:667420ms step_avg:224.34ms step:2976/6710 train_time:667651ms step_avg:224.35ms step:2977/6710 train_time:667881ms step_avg:224.35ms step:2978/6710 train_time:668112ms step_avg:224.35ms step:2979/6710 train_time:668341ms step_avg:224.35ms step:2980/6710 train_time:668572ms step_avg:224.35ms step:2981/6710 train_time:668803ms step_avg:224.36ms step:2982/6710 train_time:669033ms step_avg:224.36ms step:2983/6710 train_time:669263ms step_avg:224.36ms step:2984/6710 train_time:669494ms step_avg:224.36ms step:2985/6710 train_time:669725ms step_avg:224.36ms step:2986/6710 train_time:669956ms step_avg:224.37ms step:2987/6710 train_time:670188ms step_avg:224.37ms step:2988/6710 train_time:670419ms step_avg:224.37ms step:2989/6710 train_time:670651ms step_avg:224.37ms step:2990/6710 train_time:670883ms step_avg:224.38ms step:2991/6710 train_time:671116ms step_avg:224.38ms step:2992/6710 train_time:671347ms step_avg:224.38ms step:2993/6710 train_time:671577ms step_avg:224.38ms step:2994/6710 train_time:671807ms step_avg:224.38ms step:2995/6710 train_time:672038ms step_avg:224.39ms step:2996/6710 train_time:672271ms step_avg:224.39ms step:2997/6710 train_time:672500ms step_avg:224.39ms step:2998/6710 train_time:672731ms 
step_avg:224.39ms step:2999/6710 train_time:672963ms step_avg:224.40ms step:3000/6710 train_time:673194ms step_avg:224.40ms step:3000/6710 val_loss:3.166784 train_time:673376ms step_avg:224.46ms Parameter containing: tensor([1.0000, 1.0000, 0.4123, 1.0000, 0.6179, 1.0000, 0.5264, 1.0000], device='cuda:0', requires_grad=True) 0 [6.970746040344238, 5.9707441329956055] 1 [0.5448155403137207, 5.961458683013916] 2 [0.814954936504364, 4.567664623260498] 3 [0.6848659515380859, 3.7199835777282715] 4 [0.33057036995887756, 2.6530556678771973] 5 [0.7653844952583313, 3.9721198081970215] 6 [0.5087154507637024, 3.1752686500549316] 7 [0.8212363719940186, 5.617356777191162] 8 [0.42508259415626526, 1.7364604473114014] 9 [0.4919072985649109, 2.6024093627929688] 10 [0.6658296585083008, 3.0574493408203125] 11 [0.4293621778488159, 3.1252927780151367] 12 [0.97280353307724, 5.925477027893066] 13 [1.0810356140136719, 3.555206060409546] 14 [0.9776486754417419, 2.098963737487793] 15 [0.8091087937355042, 1.4197382926940918] 0 [12.931502342224121, 26.60266876220703, 29.373048782348633] 1 [30.447525024414062, 27.740943908691406, 68.60820007324219] 2 [76.09908294677734, 23.915021896362305, 31.12477684020996] 3 [68.92239379882812, 30.279939651489258, 35.98884201049805] 4 [34.2305908203125, 27.112743377685547, 26.3186092376709] 5 [51.78109359741211, 26.385406494140625, 39.35645294189453] 6 [45.97882843017578, 29.819210052490234, 28.350553512573242] 7 [66.35801696777344, 0.0, 47.68349075317383] 8 [40.9138069152832, 31.906078338623047, 47.30638122558594] 9 [61.462425231933594, 27.534048080444336, 36.78171157836914] 10 [84.7309341430664, 26.369834899902344, 35.25509262084961] 11 [62.88957977294922, 33.484920501708984, 19.415340423583984] 12 [94.2196273803711, 25.073322296142578, 22.38087272644043] 13 [129.03372192382812, 22.292085647583008, 29.55182647705078] 14 [143.61526489257812, 27.158458709716797, 43.323631286621094] 15 [135.545654296875, 89.28814697265625, 139.41758728027344] step:3001/6710 
train_time:673426ms step_avg:224.40ms step:3002/6710 train_time:673653ms step_avg:224.40ms step:3003/6710 train_time:673889ms step_avg:224.41ms step:3004/6710 train_time:674120ms step_avg:224.41ms step:3005/6710 train_time:674352ms step_avg:224.41ms step:3006/6710 train_time:674583ms step_avg:224.41ms step:3007/6710 train_time:674814ms step_avg:224.41ms step:3008/6710 train_time:675046ms step_avg:224.42ms step:3009/6710 train_time:675279ms step_avg:224.42ms step:3010/6710 train_time:675510ms step_avg:224.42ms step:3011/6710 train_time:675742ms step_avg:224.42ms step:3012/6710 train_time:675973ms step_avg:224.43ms step:3013/6710 train_time:676205ms step_avg:224.43ms step:3014/6710 train_time:676436ms step_avg:224.43ms step:3015/6710 train_time:676665ms step_avg:224.43ms step:3016/6710 train_time:676898ms step_avg:224.44ms step:3017/6710 train_time:677129ms step_avg:224.44ms step:3018/6710 train_time:677359ms step_avg:224.44ms step:3019/6710 train_time:677589ms step_avg:224.44ms step:3020/6710 train_time:677822ms step_avg:224.44ms step:3021/6710 train_time:678051ms step_avg:224.45ms step:3022/6710 train_time:678282ms step_avg:224.45ms step:3023/6710 train_time:678513ms step_avg:224.45ms step:3024/6710 train_time:678746ms step_avg:224.45ms step:3025/6710 train_time:678977ms step_avg:224.46ms step:3026/6710 train_time:679207ms step_avg:224.46ms step:3027/6710 train_time:679437ms step_avg:224.46ms step:3028/6710 train_time:679667ms step_avg:224.46ms step:3029/6710 train_time:679900ms step_avg:224.46ms step:3030/6710 train_time:680131ms step_avg:224.47ms step:3031/6710 train_time:680362ms step_avg:224.47ms step:3032/6710 train_time:680594ms step_avg:224.47ms step:3033/6710 train_time:680825ms step_avg:224.47ms step:3034/6710 train_time:681059ms step_avg:224.48ms step:3035/6710 train_time:681289ms step_avg:224.48ms step:3036/6710 train_time:681520ms step_avg:224.48ms step:3037/6710 train_time:681752ms step_avg:224.48ms step:3038/6710 train_time:681983ms step_avg:224.48ms 
step:3039/6710 train_time:682215ms step_avg:224.49ms step:3040/6710 train_time:682448ms step_avg:224.49ms step:3041/6710 train_time:682678ms step_avg:224.49ms step:3042/6710 train_time:682907ms step_avg:224.49ms step:3043/6710 train_time:683140ms step_avg:224.50ms step:3044/6710 train_time:683370ms step_avg:224.50ms step:3045/6710 train_time:683602ms step_avg:224.50ms step:3046/6710 train_time:683832ms step_avg:224.50ms step:3047/6710 train_time:684064ms step_avg:224.50ms step:3048/6710 train_time:684294ms step_avg:224.51ms step:3049/6710 train_time:684526ms step_avg:224.51ms step:3050/6710 train_time:684757ms step_avg:224.51ms step:3051/6710 train_time:684990ms step_avg:224.51ms step:3052/6710 train_time:685222ms step_avg:224.52ms step:3053/6710 train_time:685455ms step_avg:224.52ms step:3054/6710 train_time:685684ms step_avg:224.52ms step:3055/6710 train_time:685918ms step_avg:224.52ms step:3056/6710 train_time:686148ms step_avg:224.53ms step:3057/6710 train_time:686381ms step_avg:224.53ms step:3058/6710 train_time:686611ms step_avg:224.53ms step:3059/6710 train_time:686843ms step_avg:224.53ms step:3060/6710 train_time:687075ms step_avg:224.53ms step:3061/6710 train_time:687307ms step_avg:224.54ms step:3062/6710 train_time:687539ms step_avg:224.54ms step:3063/6710 train_time:687767ms step_avg:224.54ms step:3064/6710 train_time:687998ms step_avg:224.54ms step:3065/6710 train_time:688229ms step_avg:224.54ms step:3066/6710 train_time:688461ms step_avg:224.55ms step:3067/6710 train_time:688691ms step_avg:224.55ms step:3068/6710 train_time:688922ms step_avg:224.55ms step:3069/6710 train_time:689154ms step_avg:224.55ms step:3070/6710 train_time:689385ms step_avg:224.56ms step:3071/6710 train_time:689615ms step_avg:224.56ms step:3072/6710 train_time:689846ms step_avg:224.56ms step:3073/6710 train_time:690078ms step_avg:224.56ms step:3074/6710 train_time:690309ms step_avg:224.56ms step:3075/6710 train_time:690541ms step_avg:224.57ms step:3076/6710 train_time:690771ms 
step_avg:224.57ms step:3077/6710 train_time:691001ms step_avg:224.57ms step:3078/6710 train_time:691232ms step_avg:224.57ms step:3079/6710 train_time:691464ms step_avg:224.57ms step:3080/6710 train_time:691695ms step_avg:224.58ms step:3081/6710 train_time:691926ms step_avg:224.58ms step:3082/6710 train_time:692159ms step_avg:224.58ms step:3083/6710 train_time:692391ms step_avg:224.58ms step:3084/6710 train_time:692622ms step_avg:224.59ms step:3085/6710 train_time:692853ms step_avg:224.59ms step:3086/6710 train_time:693085ms step_avg:224.59ms step:3087/6710 train_time:693316ms step_avg:224.59ms step:3088/6710 train_time:693546ms step_avg:224.59ms step:3089/6710 train_time:693777ms step_avg:224.60ms step:3090/6710 train_time:694010ms step_avg:224.60ms step:3091/6710 train_time:694242ms step_avg:224.60ms step:3092/6710 train_time:694474ms step_avg:224.60ms step:3093/6710 train_time:694703ms step_avg:224.61ms step:3094/6710 train_time:694935ms step_avg:224.61ms step:3095/6710 train_time:695166ms step_avg:224.61ms step:3096/6710 train_time:695399ms step_avg:224.61ms step:3097/6710 train_time:695629ms step_avg:224.61ms step:3098/6710 train_time:695861ms step_avg:224.62ms step:3099/6710 train_time:696094ms step_avg:224.62ms step:3100/6710 train_time:696326ms step_avg:224.62ms step:3101/6710 train_time:696558ms step_avg:224.62ms step:3102/6710 train_time:696788ms step_avg:224.63ms step:3103/6710 train_time:697020ms step_avg:224.63ms step:3104/6710 train_time:697251ms step_avg:224.63ms step:3105/6710 train_time:697483ms step_avg:224.63ms step:3106/6710 train_time:697715ms step_avg:224.63ms step:3107/6710 train_time:697946ms step_avg:224.64ms step:3108/6710 train_time:698178ms step_avg:224.64ms step:3109/6710 train_time:698410ms step_avg:224.64ms step:3110/6710 train_time:698642ms step_avg:224.64ms step:3111/6710 train_time:698873ms step_avg:224.65ms step:3112/6710 train_time:699104ms step_avg:224.65ms step:3113/6710 train_time:699335ms step_avg:224.65ms step:3114/6710 
train_time:699566ms step_avg:224.65ms step:3115/6710 train_time:699797ms step_avg:224.65ms step:3116/6710 train_time:700028ms step_avg:224.66ms step:3117/6710 train_time:700260ms step_avg:224.66ms step:3118/6710 train_time:700491ms step_avg:224.66ms step:3119/6710 train_time:700723ms step_avg:224.66ms step:3120/6710 train_time:700954ms step_avg:224.66ms step:3121/6710 train_time:701187ms step_avg:224.67ms step:3122/6710 train_time:701418ms step_avg:224.67ms step:3123/6710 train_time:701650ms step_avg:224.67ms step:3124/6710 train_time:701881ms step_avg:224.67ms step:3125/6710 train_time:702112ms step_avg:224.68ms step:3125/6710 val_loss:3.154400 train_time:702294ms step_avg:224.73ms Parameter containing: tensor([1.0000, 1.0000, 0.4189, 1.0000, 0.5983, 1.0000, 0.5220, 1.0000], device='cuda:0', requires_grad=True) 0 [7.1031293869018555, 6.103127479553223] 1 [0.5451364517211914, 6.0879034996032715] 2 [0.8077169060707092, 4.635031700134277] 3 [0.6860005855560303, 3.7761390209198] 4 [0.336839884519577, 2.6790707111358643] 5 [0.7595824003219604, 4.017038345336914] 6 [0.5071157217025757, 3.196723699569702] 7 [0.7995939254760742, 5.705867767333984] 8 [0.4368089735507965, 1.7050957679748535] 9 [0.49011924862861633, 2.5947976112365723] 10 [0.6574623584747314, 3.0329535007476807] 11 [0.43204179406166077, 3.1184568405151367] 12 [0.9751169681549072, 6.005561828613281] 13 [1.0760523080825806, 3.5739948749542236] 14 [0.9721517562866211, 2.023336172103882] 15 [0.8064431548118591, 1.296398401260376] 0 [13.19751262664795, 26.780920028686523, 30.1543025970459] 1 [30.983762741088867, 27.99808692932129, 69.59272766113281] 2 [76.44094848632812, 24.198850631713867, 31.43442153930664] 3 [69.4999771118164, 30.65825653076172, 36.6123161315918] 4 [35.24226760864258, 27.710927963256836, 27.092741012573242] 5 [52.71549987792969, 26.90275001525879, 39.446311950683594] 6 [46.41279602050781, 30.24469566345215, 28.579927444458008] 7 [65.26773071289062, 0.0, 48.34232711791992] 8 
[41.791988372802734, 32.165618896484375, 47.58149719238281] 9 [61.672515869140625, 27.731521606445312, 37.53411865234375] 10 [83.92777252197266, 26.927377700805664, 35.75004959106445] 11 [63.33982467651367, 34.09993362426758, 19.777294158935547] 12 [95.44278717041016, 25.603191375732422, 22.686399459838867] 13 [130.18405151367188, 22.47907257080078, 29.876182556152344] 14 [144.1458282470703, 27.023351669311523, 43.200618743896484] 15 [135.6385955810547, 90.43730163574219, 139.72601318359375] step:3126/6710 train_time:702343ms step_avg:224.68ms step:3127/6710 train_time:702655ms step_avg:224.71ms step:3128/6710 train_time:702883ms step_avg:224.71ms step:3129/6710 train_time:703111ms step_avg:224.71ms step:3130/6710 train_time:703339ms step_avg:224.71ms step:3131/6710 train_time:703582ms step_avg:224.71ms step:3132/6710 train_time:703814ms step_avg:224.72ms step:3133/6710 train_time:704043ms step_avg:224.72ms step:3134/6710 train_time:704272ms step_avg:224.72ms step:3135/6710 train_time:704507ms step_avg:224.72ms step:3136/6710 train_time:704739ms step_avg:224.73ms step:3137/6710 train_time:704970ms step_avg:224.73ms step:3138/6710 train_time:705200ms step_avg:224.73ms step:3139/6710 train_time:705430ms step_avg:224.73ms step:3140/6710 train_time:705665ms step_avg:224.73ms step:3141/6710 train_time:705895ms step_avg:224.74ms step:3142/6710 train_time:706125ms step_avg:224.74ms step:3143/6710 train_time:706357ms step_avg:224.74ms step:3144/6710 train_time:706590ms step_avg:224.74ms step:3145/6710 train_time:706821ms step_avg:224.74ms step:3146/6710 train_time:707051ms step_avg:224.75ms step:3147/6710 train_time:707283ms step_avg:224.75ms step:3148/6710 train_time:707512ms step_avg:224.75ms step:3149/6710 train_time:707745ms step_avg:224.75ms step:3150/6710 train_time:707976ms step_avg:224.75ms step:3151/6710 train_time:708207ms step_avg:224.76ms step:3152/6710 train_time:708438ms step_avg:224.76ms step:3153/6710 train_time:708670ms step_avg:224.76ms step:3154/6710 
train_time:708903ms step_avg:224.76ms step:3155/6710 train_time:709133ms step_avg:224.76ms step:3156/6710 train_time:709364ms step_avg:224.77ms step:3157/6710 train_time:709597ms step_avg:224.77ms step:3158/6710 train_time:709828ms step_avg:224.77ms step:3159/6710 train_time:710059ms step_avg:224.77ms step:3160/6710 train_time:710289ms step_avg:224.77ms step:3161/6710 train_time:710521ms step_avg:224.78ms step:3162/6710 train_time:710751ms step_avg:224.78ms step:3163/6710 train_time:710981ms step_avg:224.78ms step:3164/6710 train_time:711215ms step_avg:224.78ms step:3165/6710 train_time:711446ms step_avg:224.79ms step:3166/6710 train_time:711677ms step_avg:224.79ms step:3167/6710 train_time:711908ms step_avg:224.79ms step:3168/6710 train_time:712140ms step_avg:224.79ms step:3169/6710 train_time:712372ms step_avg:224.79ms step:3170/6710 train_time:712603ms step_avg:224.80ms step:3171/6710 train_time:712835ms step_avg:224.80ms step:3172/6710 train_time:713067ms step_avg:224.80ms step:3173/6710 train_time:713298ms step_avg:224.80ms step:3174/6710 train_time:713529ms step_avg:224.80ms step:3175/6710 train_time:713761ms step_avg:224.81ms step:3176/6710 train_time:713991ms step_avg:224.81ms step:3177/6710 train_time:714222ms step_avg:224.81ms step:3178/6710 train_time:714452ms step_avg:224.81ms step:3179/6710 train_time:714683ms step_avg:224.81ms step:3180/6710 train_time:714913ms step_avg:224.82ms step:3181/6710 train_time:715146ms step_avg:224.82ms step:3182/6710 train_time:715376ms step_avg:224.82ms step:3183/6710 train_time:715608ms step_avg:224.82ms step:3184/6710 train_time:715840ms step_avg:224.82ms step:3185/6710 train_time:716072ms step_avg:224.83ms step:3186/6710 train_time:716303ms step_avg:224.83ms step:3187/6710 train_time:716533ms step_avg:224.83ms step:3188/6710 train_time:716763ms step_avg:224.83ms step:3189/6710 train_time:716995ms step_avg:224.83ms step:3190/6710 train_time:717226ms step_avg:224.84ms step:3191/6710 train_time:717457ms step_avg:224.84ms 
step:3192/6710 train_time:717688ms step_avg:224.84ms step:3193/6710 train_time:717919ms step_avg:224.84ms step:3194/6710 train_time:718149ms step_avg:224.84ms step:3195/6710 train_time:718383ms step_avg:224.85ms step:3196/6710 train_time:718613ms step_avg:224.85ms step:3197/6710 train_time:718845ms step_avg:224.85ms step:3198/6710 train_time:719075ms step_avg:224.85ms step:3199/6710 train_time:719306ms step_avg:224.85ms step:3200/6710 train_time:719538ms step_avg:224.86ms step:3201/6710 train_time:719769ms step_avg:224.86ms step:3202/6710 train_time:720000ms step_avg:224.86ms step:3203/6710 train_time:720232ms step_avg:224.86ms step:3204/6710 train_time:720464ms step_avg:224.86ms step:3205/6710 train_time:720694ms step_avg:224.87ms step:3206/6710 train_time:720926ms step_avg:224.87ms step:3207/6710 train_time:721157ms step_avg:224.87ms step:3208/6710 train_time:721388ms step_avg:224.87ms step:3209/6710 train_time:721620ms step_avg:224.87ms step:3210/6710 train_time:721850ms step_avg:224.88ms step:3211/6710 train_time:722083ms step_avg:224.88ms step:3212/6710 train_time:722314ms step_avg:224.88ms step:3213/6710 train_time:722547ms step_avg:224.88ms step:3214/6710 train_time:722778ms step_avg:224.88ms step:3215/6710 train_time:723009ms step_avg:224.89ms step:3216/6710 train_time:723238ms step_avg:224.89ms step:3217/6710 train_time:723471ms step_avg:224.89ms step:3218/6710 train_time:723703ms step_avg:224.89ms step:3219/6710 train_time:723934ms step_avg:224.89ms step:3220/6710 train_time:724166ms step_avg:224.90ms step:3221/6710 train_time:724395ms step_avg:224.90ms step:3222/6710 train_time:724626ms step_avg:224.90ms step:3223/6710 train_time:724858ms step_avg:224.90ms step:3224/6710 train_time:725089ms step_avg:224.90ms step:3225/6710 train_time:725322ms step_avg:224.91ms step:3226/6710 train_time:725552ms step_avg:224.91ms step:3227/6710 train_time:725782ms step_avg:224.91ms step:3228/6710 train_time:726012ms step_avg:224.91ms step:3229/6710 train_time:726244ms 
step_avg:224.91ms step:3230/6710 train_time:726478ms step_avg:224.92ms step:3231/6710 train_time:726709ms step_avg:224.92ms step:3232/6710 train_time:726940ms step_avg:224.92ms step:3233/6710 train_time:727170ms step_avg:224.92ms step:3234/6710 train_time:727403ms step_avg:224.92ms step:3235/6710 train_time:727634ms step_avg:224.93ms step:3236/6710 train_time:727866ms step_avg:224.93ms step:3237/6710 train_time:728098ms step_avg:224.93ms step:3238/6710 train_time:728330ms step_avg:224.93ms step:3239/6710 train_time:728561ms step_avg:224.93ms step:3240/6710 train_time:728792ms step_avg:224.94ms step:3241/6710 train_time:729023ms step_avg:224.94ms step:3242/6710 train_time:729255ms step_avg:224.94ms step:3243/6710 train_time:729487ms step_avg:224.94ms step:3244/6710 train_time:729718ms step_avg:224.94ms step:3245/6710 train_time:729948ms step_avg:224.95ms step:3246/6710 train_time:730180ms step_avg:224.95ms step:3247/6710 train_time:730411ms step_avg:224.95ms step:3248/6710 train_time:730641ms step_avg:224.95ms step:3249/6710 train_time:730873ms step_avg:224.95ms step:3250/6710 train_time:731103ms step_avg:224.95ms step:3250/6710 val_loss:3.141666 train_time:731286ms step_avg:225.01ms Parameter containing: tensor([1.0000, 1.0000, 0.4080, 1.0000, 0.5969, 1.0000, 0.5060, 1.0000], device='cuda:0', requires_grad=True) 0 [7.229988098144531, 6.229986190795898] 1 [0.5332391262054443, 6.200290203094482] 2 [0.798800528049469, 4.658230304718018] 3 [0.6906586289405823, 3.8080146312713623] 4 [0.3383459746837616, 2.7027571201324463] 5 [0.7518501877784729, 4.0105299949646] 6 [0.5029247999191284, 3.1799213886260986] 7 [0.7913029789924622, 5.768707275390625] 8 [0.43706944584846497, 1.6462591886520386] 9 [0.4899386167526245, 2.577455759048462] 10 [0.65777987241745, 3.0387022495269775] 11 [0.4283484220504761, 3.1463849544525146] 12 [0.9638110995292664, 6.102240562438965] 13 [1.0752345323562622, 3.6151974201202393] 14 [0.9737532138824463, 1.9915835857391357] 15 [0.8146663904190063, 
1.2120434045791626] 0 [13.451679229736328, 26.96352767944336, 30.328054428100586] 1 [30.6747989654541, 28.420368194580078, 67.74642944335938] 2 [74.39274597167969, 24.18399429321289, 31.672508239746094] 3 [68.8687515258789, 30.962182998657227, 36.568424224853516] 4 [35.21794509887695, 27.845325469970703, 27.550615310668945] 5 [52.38083267211914, 27.119443893432617, 39.65043258666992] 6 [45.87765121459961, 30.40192985534668, 29.071683883666992] 7 [64.43746948242188, 0.0, 48.08747863769531] 8 [41.412567138671875, 32.248779296875, 47.53995895385742] 9 [60.765716552734375, 27.868818283081055, 37.632144927978516] 10 [83.29508209228516, 27.127609252929688, 36.20928955078125] 11 [62.20193862915039, 34.17485046386719, 19.966989517211914] 12 [93.50556945800781, 25.879276275634766, 22.700586318969727] 13 [128.2462158203125, 22.331729888916016, 29.742172241210938] 14 [142.33570861816406, 27.030824661254883, 42.82261657714844] 15 [135.38450622558594, 90.84608459472656, 141.03765869140625] step:3251/6710 train_time:731336ms step_avg:224.96ms step:3252/6710 train_time:731564ms step_avg:224.96ms step:3253/6710 train_time:731802ms step_avg:224.96ms step:3254/6710 train_time:732033ms step_avg:224.96ms step:3255/6710 train_time:732263ms step_avg:224.97ms step:3256/6710 train_time:732493ms step_avg:224.97ms step:3257/6710 train_time:732727ms step_avg:224.97ms step:3258/6710 train_time:732958ms step_avg:224.97ms step:3259/6710 train_time:733188ms step_avg:224.97ms step:3260/6710 train_time:733416ms step_avg:224.97ms step:3261/6710 train_time:733648ms step_avg:224.98ms step:3262/6710 train_time:733880ms step_avg:224.98ms step:3263/6710 train_time:734110ms step_avg:224.98ms step:3264/6710 train_time:734341ms step_avg:224.98ms step:3265/6710 train_time:734572ms step_avg:224.98ms step:3266/6710 train_time:734804ms step_avg:224.99ms step:3267/6710 train_time:735036ms step_avg:224.99ms step:3268/6710 train_time:735268ms step_avg:224.99ms step:3269/6710 train_time:735500ms step_avg:224.99ms 
step:3270/6710 train_time:735731ms step_avg:224.99ms step:3271/6710 train_time:735964ms step_avg:225.00ms step:3272/6710 train_time:736194ms step_avg:225.00ms step:3273/6710 train_time:736425ms step_avg:225.00ms step:3274/6710 train_time:736657ms step_avg:225.00ms step:3275/6710 train_time:736889ms step_avg:225.00ms step:3276/6710 train_time:737119ms step_avg:225.01ms step:3277/6710 train_time:737351ms step_avg:225.01ms step:3278/6710 train_time:737584ms step_avg:225.01ms step:3279/6710 train_time:737815ms step_avg:225.01ms step:3280/6710 train_time:738047ms step_avg:225.01ms step:3281/6710 train_time:738278ms step_avg:225.02ms step:3282/6710 train_time:738508ms step_avg:225.02ms step:3283/6710 train_time:738739ms step_avg:225.02ms step:3284/6710 train_time:738971ms step_avg:225.02ms step:3285/6710 train_time:739202ms step_avg:225.02ms step:3286/6710 train_time:739433ms step_avg:225.03ms step:3287/6710 train_time:739664ms step_avg:225.03ms step:3288/6710 train_time:739895ms step_avg:225.03ms step:3289/6710 train_time:740126ms step_avg:225.03ms step:3290/6710 train_time:740357ms step_avg:225.03ms step:3291/6710 train_time:740589ms step_avg:225.03ms step:3292/6710 train_time:740820ms step_avg:225.04ms step:3293/6710 train_time:741053ms step_avg:225.04ms step:3294/6710 train_time:741285ms step_avg:225.04ms step:3295/6710 train_time:741515ms step_avg:225.04ms step:3296/6710 train_time:741747ms step_avg:225.04ms step:3297/6710 train_time:741977ms step_avg:225.05ms step:3298/6710 train_time:742209ms step_avg:225.05ms step:3299/6710 train_time:742440ms step_avg:225.05ms step:3300/6710 train_time:742670ms step_avg:225.05ms step:3301/6710 train_time:742902ms step_avg:225.05ms step:3302/6710 train_time:743133ms step_avg:225.06ms step:3303/6710 train_time:743365ms step_avg:225.06ms step:3304/6710 train_time:743595ms step_avg:225.06ms step:3305/6710 train_time:743827ms step_avg:225.06ms step:3306/6710 train_time:744057ms step_avg:225.06ms step:3307/6710 train_time:744289ms 
step_avg:225.06ms step:3308/6710 train_time:744519ms step_avg:225.07ms step:3309/6710 train_time:744751ms step_avg:225.07ms step:3310/6710 train_time:744981ms step_avg:225.07ms step:3311/6710 train_time:745212ms step_avg:225.07ms step:3312/6710 train_time:745444ms step_avg:225.07ms step:3313/6710 train_time:745676ms step_avg:225.08ms step:3314/6710 train_time:745907ms step_avg:225.08ms step:3315/6710 train_time:746137ms step_avg:225.08ms step:3316/6710 train_time:746369ms step_avg:225.08ms step:3317/6710 train_time:746600ms step_avg:225.08ms step:3318/6710 train_time:746831ms step_avg:225.08ms step:3319/6710 train_time:747062ms step_avg:225.09ms step:3320/6710 train_time:747294ms step_avg:225.09ms step:3321/6710 train_time:747526ms step_avg:225.09ms step:3322/6710 train_time:747756ms step_avg:225.09ms step:3323/6710 train_time:747988ms step_avg:225.09ms step:3324/6710 train_time:748218ms step_avg:225.10ms step:3325/6710 train_time:748450ms step_avg:225.10ms step:3326/6710 train_time:748680ms step_avg:225.10ms step:3327/6710 train_time:748912ms step_avg:225.10ms step:3328/6710 train_time:749142ms step_avg:225.10ms step:3329/6710 train_time:749374ms step_avg:225.10ms step:3330/6710 train_time:749606ms step_avg:225.11ms step:3331/6710 train_time:749837ms step_avg:225.11ms step:3332/6710 train_time:750068ms step_avg:225.11ms step:3333/6710 train_time:750297ms step_avg:225.11ms step:3334/6710 train_time:750530ms step_avg:225.11ms step:3335/6710 train_time:750760ms step_avg:225.12ms step:3336/6710 train_time:750992ms step_avg:225.12ms step:3337/6710 train_time:751222ms step_avg:225.12ms step:3338/6710 train_time:751455ms step_avg:225.12ms step:3339/6710 train_time:751686ms step_avg:225.12ms step:3340/6710 train_time:751916ms step_avg:225.12ms step:3341/6710 train_time:752148ms step_avg:225.13ms step:3342/6710 train_time:752380ms step_avg:225.13ms step:3343/6710 train_time:752612ms step_avg:225.13ms step:3344/6710 train_time:752842ms step_avg:225.13ms step:3345/6710 
train_time:753073ms step_avg:225.13ms step:3346/6710 train_time:753303ms step_avg:225.14ms step:3347/6710 train_time:753535ms step_avg:225.14ms step:3348/6710 train_time:753767ms step_avg:225.14ms step:3349/6710 train_time:753998ms step_avg:225.14ms step:3350/6710 train_time:754230ms step_avg:225.14ms step:3351/6710 train_time:754460ms step_avg:225.14ms step:3352/6710 train_time:754691ms step_avg:225.15ms step:3353/6710 train_time:754924ms step_avg:225.15ms step:3354/6710 train_time:755156ms step_avg:225.15ms step:3355/6710 train_time:755387ms step_avg:225.15ms step:3356/6710 train_time:755617ms step_avg:225.15ms step:3357/6710 train_time:755849ms step_avg:225.16ms step:3358/6710 train_time:756080ms step_avg:225.16ms step:3359/6710 train_time:756312ms step_avg:225.16ms step:3360/6710 train_time:756543ms step_avg:225.16ms step:3361/6710 train_time:756776ms step_avg:225.16ms step:3362/6710 train_time:757009ms step_avg:225.17ms step:3363/6710 train_time:757240ms step_avg:225.17ms step:3364/6710 train_time:757472ms step_avg:225.17ms step:3365/6710 train_time:757703ms step_avg:225.17ms step:3366/6710 train_time:757935ms step_avg:225.17ms step:3367/6710 train_time:758166ms step_avg:225.18ms step:3368/6710 train_time:758396ms step_avg:225.18ms step:3369/6710 train_time:758628ms step_avg:225.18ms step:3370/6710 train_time:758860ms step_avg:225.18ms step:3371/6710 train_time:759092ms step_avg:225.18ms step:3372/6710 train_time:759324ms step_avg:225.19ms step:3373/6710 train_time:759555ms step_avg:225.19ms step:3374/6710 train_time:759786ms step_avg:225.19ms step:3375/6710 train_time:760018ms step_avg:225.19ms step:3375/6710 val_loss:3.131315 train_time:760199ms step_avg:225.24ms Parameter containing: tensor([1.0000, 1.0000, 0.4191, 1.0000, 0.6000, 1.0000, 0.5008, 1.0000], device='cuda:0', requires_grad=True) 0 [7.323026657104492, 6.323024749755859] 1 [0.5292164087295532, 6.268229007720947] 2 [0.7865590453147888, 4.663209915161133] 3 [0.6895517110824585, 3.831717014312744] 4 
[0.34159672260284424, 2.722752094268799] 5 [0.7460484504699707, 3.995820999145508] 6 [0.5062918066978455, 3.1357157230377197] 7 [0.7804322242736816, 5.756446361541748] 8 [0.4371863901615143, 1.5476977825164795] 9 [0.48828786611557007, 2.5234858989715576] 10 [0.6572701334953308, 3.016080379486084] 11 [0.4301551878452301, 3.102759599685669] 12 [0.9598251581192017, 6.1417059898376465] 13 [1.0671504735946655, 3.5759379863739014] 14 [0.9714495539665222, 1.899660348892212] 15 [0.8173044323921204, 1.1002956628799438] 0 [13.639691352844238, 27.007160186767578, 30.78859519958496] 1 [30.679019927978516, 28.557924270629883, 69.90226745605469] 2 [74.732421875, 24.139434814453125, 31.54386329650879] 3 [68.74687194824219, 30.973552703857422, 36.961063385009766] 4 [35.54399871826172, 27.787099838256836, 27.96329116821289] 5 [52.236351013183594, 27.25041389465332, 40.484127044677734] 6 [46.37587356567383, 30.60716438293457, 29.609825134277344] 7 [64.13199615478516, 0.0, 47.9726676940918] 8 [41.250545501708984, 32.50614547729492, 47.67972183227539] 9 [60.469688415527344, 27.909759521484375, 37.488468170166016] 10 [82.92333984375, 27.352312088012695, 36.4520149230957] 11 [62.60371017456055, 34.34087371826172, 20.527061462402344] 12 [93.7215805053711, 26.032859802246094, 23.197813034057617] 13 [127.73301696777344, 22.093050003051758, 30.117733001708984] 14 [141.75515747070312, 26.717317581176758, 43.032649993896484] 15 [135.50242614746094, 90.25901794433594, 146.8444061279297] step:3376/6710 train_time:760249ms step_avg:225.19ms step:3377/6710 train_time:760478ms step_avg:225.19ms step:3378/6710 train_time:760718ms step_avg:225.20ms step:3379/6710 train_time:760948ms step_avg:225.20ms step:3380/6710 train_time:761177ms step_avg:225.20ms step:3381/6710 train_time:761408ms step_avg:225.20ms step:3382/6710 train_time:761643ms step_avg:225.20ms step:3383/6710 train_time:761873ms step_avg:225.21ms step:3384/6710 train_time:762103ms step_avg:225.21ms step:3385/6710 train_time:762333ms 
step_avg:225.21ms step:3386/6710 train_time:762566ms step_avg:225.21ms step:3387/6710 train_time:762797ms step_avg:225.21ms step:3388/6710 train_time:763027ms step_avg:225.21ms step:3389/6710 train_time:763256ms step_avg:225.22ms step:3390/6710 train_time:763486ms step_avg:225.22ms step:3391/6710 train_time:763719ms step_avg:225.22ms step:3392/6710 train_time:763951ms step_avg:225.22ms step:3393/6710 train_time:764181ms step_avg:225.22ms step:3394/6710 train_time:764412ms step_avg:225.22ms step:3395/6710 train_time:764644ms step_avg:225.23ms step:3396/6710 train_time:764875ms step_avg:225.23ms step:3397/6710 train_time:765105ms step_avg:225.23ms step:3398/6710 train_time:765335ms step_avg:225.23ms step:3399/6710 train_time:765567ms step_avg:225.23ms step:3400/6710 train_time:765799ms step_avg:225.24ms step:3401/6710 train_time:766031ms step_avg:225.24ms step:3402/6710 train_time:766263ms step_avg:225.24ms step:3403/6710 train_time:766495ms step_avg:225.24ms step:3404/6710 train_time:766726ms step_avg:225.24ms step:3405/6710 train_time:766956ms step_avg:225.24ms step:3406/6710 train_time:767186ms step_avg:225.25ms step:3407/6710 train_time:767419ms step_avg:225.25ms step:3408/6710 train_time:767652ms step_avg:225.25ms step:3409/6710 train_time:767882ms step_avg:225.25ms step:3410/6710 train_time:768113ms step_avg:225.25ms step:3411/6710 train_time:768344ms step_avg:225.25ms step:3412/6710 train_time:768576ms step_avg:225.26ms step:3413/6710 train_time:768808ms step_avg:225.26ms step:3414/6710 train_time:769039ms step_avg:225.26ms step:3415/6710 train_time:769269ms step_avg:225.26ms step:3416/6710 train_time:769500ms step_avg:225.26ms step:3417/6710 train_time:769731ms step_avg:225.27ms step:3418/6710 train_time:769962ms step_avg:225.27ms step:3419/6710 train_time:770191ms step_avg:225.27ms step:3420/6710 train_time:770424ms step_avg:225.27ms step:3421/6710 train_time:770655ms step_avg:225.27ms step:3422/6710 train_time:770887ms step_avg:225.27ms step:3423/6710 
train_time:771119ms step_avg:225.28ms step:3424/6710 train_time:771349ms step_avg:225.28ms step:3425/6710 train_time:771580ms step_avg:225.28ms step:3426/6710 train_time:771811ms step_avg:225.28ms step:3427/6710 train_time:772042ms step_avg:225.28ms step:3428/6710 train_time:772273ms step_avg:225.28ms step:3429/6710 train_time:772505ms step_avg:225.29ms step:3430/6710 train_time:772734ms step_avg:225.29ms step:3431/6710 train_time:772966ms step_avg:225.29ms step:3432/6710 train_time:773199ms step_avg:225.29ms step:3433/6710 train_time:773428ms step_avg:225.29ms step:3434/6710 train_time:773659ms step_avg:225.29ms step:3435/6710 train_time:773890ms step_avg:225.30ms step:3436/6710 train_time:774122ms step_avg:225.30ms step:3437/6710 train_time:774352ms step_avg:225.30ms step:3438/6710 train_time:774583ms step_avg:225.30ms step:3439/6710 train_time:774814ms step_avg:225.30ms step:3440/6710 train_time:775045ms step_avg:225.30ms step:3441/6710 train_time:775276ms step_avg:225.31ms step:3442/6710 train_time:775507ms step_avg:225.31ms step:3443/6710 train_time:775737ms step_avg:225.31ms step:3444/6710 train_time:775969ms step_avg:225.31ms step:3445/6710 train_time:776201ms step_avg:225.31ms step:3446/6710 train_time:776431ms step_avg:225.31ms step:3447/6710 train_time:776662ms step_avg:225.32ms step:3448/6710 train_time:776893ms step_avg:225.32ms step:3449/6710 train_time:777124ms step_avg:225.32ms step:3450/6710 train_time:777356ms step_avg:225.32ms step:3451/6710 train_time:777588ms step_avg:225.32ms step:3452/6710 train_time:777820ms step_avg:225.32ms step:3453/6710 train_time:778052ms step_avg:225.33ms step:3454/6710 train_time:778283ms step_avg:225.33ms step:3455/6710 train_time:778514ms step_avg:225.33ms step:3456/6710 train_time:778745ms step_avg:225.33ms step:3457/6710 train_time:778976ms step_avg:225.33ms step:3458/6710 train_time:779207ms step_avg:225.33ms step:3459/6710 train_time:779438ms step_avg:225.34ms step:3460/6710 train_time:779667ms step_avg:225.34ms 
step:3461/6710 train_time:779899ms step_avg:225.34ms step:3462/6710 train_time:780129ms step_avg:225.34ms step:3463/6710 train_time:780361ms step_avg:225.34ms step:3464/6710 train_time:780590ms step_avg:225.34ms step:3465/6710 train_time:780821ms step_avg:225.35ms step:3466/6710 train_time:781053ms step_avg:225.35ms step:3467/6710 train_time:781284ms step_avg:225.35ms step:3468/6710 train_time:781515ms step_avg:225.35ms step:3469/6710 train_time:781745ms step_avg:225.35ms step:3470/6710 train_time:781976ms step_avg:225.35ms step:3471/6710 train_time:782207ms step_avg:225.36ms step:3472/6710 train_time:782439ms step_avg:225.36ms step:3473/6710 train_time:782669ms step_avg:225.36ms step:3474/6710 train_time:782899ms step_avg:225.36ms step:3475/6710 train_time:783131ms step_avg:225.36ms step:3476/6710 train_time:783362ms step_avg:225.36ms step:3477/6710 train_time:783595ms step_avg:225.37ms step:3478/6710 train_time:783825ms step_avg:225.37ms step:3479/6710 train_time:784057ms step_avg:225.37ms step:3480/6710 train_time:784287ms step_avg:225.37ms step:3481/6710 train_time:784520ms step_avg:225.37ms step:3482/6710 train_time:784756ms step_avg:225.38ms step:3483/6710 train_time:784989ms step_avg:225.38ms step:3484/6710 train_time:785226ms step_avg:225.38ms step:3485/6710 train_time:785461ms step_avg:225.38ms step:3486/6710 train_time:785696ms step_avg:225.39ms step:3487/6710 train_time:785930ms step_avg:225.39ms step:3488/6710 train_time:786165ms step_avg:225.39ms step:3489/6710 train_time:786399ms step_avg:225.39ms step:3490/6710 train_time:786634ms step_avg:225.40ms step:3491/6710 train_time:786867ms step_avg:225.40ms step:3492/6710 train_time:787101ms step_avg:225.40ms step:3493/6710 train_time:787333ms step_avg:225.40ms step:3494/6710 train_time:787569ms step_avg:225.41ms step:3495/6710 train_time:787805ms step_avg:225.41ms step:3496/6710 train_time:788038ms step_avg:225.41ms step:3497/6710 train_time:788270ms step_avg:225.41ms step:3498/6710 train_time:788507ms 
step_avg:225.42ms step:3499/6710 train_time:788743ms step_avg:225.42ms step:3500/6710 train_time:788977ms step_avg:225.42ms step:3500/6710 val_loss:3.120313 train_time:789162ms step_avg:225.47ms Parameter containing: tensor([1.0000, 1.0000, 0.4127, 1.0000, 0.5763, 1.0000, 0.4882, 1.0000], device='cuda:0', requires_grad=True) 0 [7.392678737640381, 6.392676830291748] 1 [0.5255197286605835, 6.293041229248047] 2 [0.7772279381752014, 4.62827205657959] 3 [0.6823801398277283, 3.812230348587036] 4 [0.34968164563179016, 2.713965892791748] 5 [0.7277050614356995, 3.963045358657837] 6 [0.5083800554275513, 3.048393487930298] 7 [0.7790896892547607, 5.7270827293396] 8 [0.43733662366867065, 1.4513202905654907] 9 [0.48809874057769775, 2.476222515106201] 10 [0.6566529273986816, 2.98366379737854] 11 [0.43342968821525574, 3.083894729614258] 12 [0.9516753554344177, 6.180331707000732] 13 [1.0590585470199585, 3.5735936164855957] 14 [0.9715439677238464, 1.8491746187210083] 15 [0.8259719610214233, 1.0321593284606934] 0 [13.780743598937988, 27.112590789794922, 31.53762435913086] 1 [30.88115692138672, 28.52595329284668, 71.71121978759766] 2 [75.0363540649414, 23.906824111938477, 31.33451271057129] 3 [67.98888397216797, 30.786954879760742, 36.875003814697266] 4 [35.9697265625, 27.95625877380371, 27.83889389038086] 5 [51.227352142333984, 27.120800018310547, 40.154457092285156] 6 [45.8529167175293, 30.510908126831055, 29.12046241760254] 7 [63.1748161315918, 0.0, 47.49304962158203] 8 [40.663394927978516, 31.945173263549805, 47.46476745605469] 9 [59.21359634399414, 27.504850387573242, 37.460018157958984] 10 [81.0352554321289, 27.302175521850586, 36.38107681274414] 11 [61.946136474609375, 34.18116760253906, 20.528535842895508] 12 [92.1584243774414, 26.18553924560547, 23.139610290527344] 13 [125.19927978515625, 21.820276260375977, 29.834468841552734] 14 [139.096923828125, 26.667377471923828, 42.37102127075195] 15 [134.55862426757812, 89.22938537597656, 147.00701904296875] step:3501/6710 
train_time:789212ms step_avg:225.42ms step:3502/6710 train_time:789443ms step_avg:225.43ms step:3503/6710 train_time:789682ms step_avg:225.43ms step:3504/6710 train_time:789915ms step_avg:225.43ms step:3505/6710 train_time:790152ms step_avg:225.44ms step:3506/6710 train_time:790387ms step_avg:225.44ms step:3507/6710 train_time:790623ms step_avg:225.44ms step:3508/6710 train_time:790857ms step_avg:225.44ms step:3509/6710 train_time:791091ms step_avg:225.45ms step:3510/6710 train_time:791325ms step_avg:225.45ms step:3511/6710 train_time:791560ms step_avg:225.45ms step:3512/6710 train_time:791794ms step_avg:225.45ms step:3513/6710 train_time:792028ms step_avg:225.46ms step:3514/6710 train_time:792262ms step_avg:225.46ms step:3515/6710 train_time:792496ms step_avg:225.46ms step:3516/6710 train_time:792731ms step_avg:225.46ms step:3517/6710 train_time:792964ms step_avg:225.47ms step:3518/6710 train_time:793197ms step_avg:225.47ms step:3519/6710 train_time:793432ms step_avg:225.47ms step:3520/6710 train_time:793667ms step_avg:225.47ms step:3521/6710 train_time:793903ms step_avg:225.48ms step:3522/6710 train_time:794137ms step_avg:225.48ms step:3523/6710 train_time:794370ms step_avg:225.48ms step:3524/6710 train_time:794605ms step_avg:225.48ms step:3525/6710 train_time:794840ms step_avg:225.49ms step:3526/6710 train_time:795074ms step_avg:225.49ms step:3527/6710 train_time:795308ms step_avg:225.49ms step:3528/6710 train_time:795542ms step_avg:225.49ms step:3529/6710 train_time:795778ms step_avg:225.50ms step:3530/6710 train_time:796013ms step_avg:225.50ms step:3531/6710 train_time:796247ms step_avg:225.50ms step:3532/6710 train_time:796481ms step_avg:225.50ms step:3533/6710 train_time:796718ms step_avg:225.51ms step:3534/6710 train_time:796952ms step_avg:225.51ms step:3535/6710 train_time:797186ms step_avg:225.51ms step:3536/6710 train_time:797419ms step_avg:225.51ms step:3537/6710 train_time:797655ms step_avg:225.52ms step:3538/6710 train_time:797888ms step_avg:225.52ms 
step:3539/6710 train_time:798122ms step_avg:225.52ms step:3540/6710 train_time:798356ms step_avg:225.52ms step:3541/6710 train_time:798590ms step_avg:225.53ms step:3542/6710 train_time:798825ms step_avg:225.53ms step:3543/6710 train_time:799059ms step_avg:225.53ms step:3544/6710 train_time:799294ms step_avg:225.53ms step:3545/6710 train_time:799530ms step_avg:225.54ms step:3546/6710 train_time:799764ms step_avg:225.54ms step:3547/6710 train_time:799999ms step_avg:225.54ms step:3548/6710 train_time:800233ms step_avg:225.54ms step:3549/6710 train_time:800466ms step_avg:225.55ms step:3550/6710 train_time:800702ms step_avg:225.55ms step:3551/6710 train_time:800939ms step_avg:225.55ms step:3552/6710 train_time:801173ms step_avg:225.56ms step:3553/6710 train_time:801408ms step_avg:225.56ms step:3554/6710 train_time:801642ms step_avg:225.56ms step:3555/6710 train_time:801878ms step_avg:225.56ms step:3556/6710 train_time:802113ms step_avg:225.57ms step:3557/6710 train_time:802348ms step_avg:225.57ms step:3558/6710 train_time:802586ms step_avg:225.57ms step:3559/6710 train_time:802820ms step_avg:225.57ms step:3560/6710 train_time:803054ms step_avg:225.58ms step:3561/6710 train_time:803288ms step_avg:225.58ms step:3562/6710 train_time:803523ms step_avg:225.58ms step:3563/6710 train_time:803757ms step_avg:225.58ms step:3564/6710 train_time:803991ms step_avg:225.59ms step:3565/6710 train_time:804224ms step_avg:225.59ms step:3566/6710 train_time:804458ms step_avg:225.59ms step:3567/6710 train_time:804692ms step_avg:225.59ms step:3568/6710 train_time:804925ms step_avg:225.60ms step:3569/6710 train_time:805160ms step_avg:225.60ms step:3570/6710 train_time:805394ms step_avg:225.60ms step:3571/6710 train_time:805629ms step_avg:225.60ms step:3572/6710 train_time:805864ms step_avg:225.61ms step:3573/6710 train_time:806098ms step_avg:225.61ms step:3574/6710 train_time:806334ms step_avg:225.61ms step:3575/6710 train_time:806568ms step_avg:225.61ms step:3576/6710 train_time:806803ms 
step_avg:225.62ms step:3577/6710 train_time:807037ms step_avg:225.62ms step:3578/6710 train_time:807271ms step_avg:225.62ms step:3579/6710 train_time:807509ms step_avg:225.62ms step:3580/6710 train_time:807743ms step_avg:225.63ms step:3581/6710 train_time:807979ms step_avg:225.63ms step:3582/6710 train_time:808215ms step_avg:225.63ms step:3583/6710 train_time:808451ms step_avg:225.64ms step:3584/6710 train_time:808686ms step_avg:225.64ms step:3585/6710 train_time:808921ms step_avg:225.64ms step:3586/6710 train_time:809154ms step_avg:225.64ms step:3587/6710 train_time:809389ms step_avg:225.65ms step:3588/6710 train_time:809624ms step_avg:225.65ms step:3589/6710 train_time:809857ms step_avg:225.65ms step:3590/6710 train_time:810093ms step_avg:225.65ms step:3591/6710 train_time:810327ms step_avg:225.65ms step:3592/6710 train_time:810561ms step_avg:225.66ms step:3593/6710 train_time:810795ms step_avg:225.66ms step:3594/6710 train_time:811030ms step_avg:225.66ms step:3595/6710 train_time:811265ms step_avg:225.66ms step:3596/6710 train_time:811501ms step_avg:225.67ms step:3597/6710 train_time:811734ms step_avg:225.67ms step:3598/6710 train_time:811970ms step_avg:225.67ms step:3599/6710 train_time:812205ms step_avg:225.68ms step:3600/6710 train_time:812439ms step_avg:225.68ms step:3601/6710 train_time:812674ms step_avg:225.68ms step:3602/6710 train_time:812911ms step_avg:225.68ms step:3603/6710 train_time:813144ms step_avg:225.69ms step:3604/6710 train_time:813377ms step_avg:225.69ms step:3605/6710 train_time:813612ms step_avg:225.69ms step:3606/6710 train_time:813847ms step_avg:225.69ms step:3607/6710 train_time:814082ms step_avg:225.69ms step:3608/6710 train_time:814314ms step_avg:225.70ms step:3609/6710 train_time:814549ms step_avg:225.70ms step:3610/6710 train_time:814784ms step_avg:225.70ms step:3611/6710 train_time:815018ms step_avg:225.70ms step:3612/6710 train_time:815251ms step_avg:225.71ms step:3613/6710 train_time:815485ms step_avg:225.71ms step:3614/6710 
train_time:815720ms step_avg:225.71ms step:3615/6710 train_time:815954ms step_avg:225.71ms step:3616/6710 train_time:816190ms step_avg:225.72ms step:3617/6710 train_time:816424ms step_avg:225.72ms step:3618/6710 train_time:816658ms step_avg:225.72ms step:3619/6710 train_time:816890ms step_avg:225.72ms step:3620/6710 train_time:817126ms step_avg:225.73ms step:3621/6710 train_time:817363ms step_avg:225.73ms step:3622/6710 train_time:817597ms step_avg:225.73ms step:3623/6710 train_time:817832ms step_avg:225.73ms step:3624/6710 train_time:818065ms step_avg:225.74ms step:3625/6710 train_time:818303ms step_avg:225.74ms step:3625/6710 val_loss:3.110254 train_time:818490ms step_avg:225.79ms Parameter containing: tensor([1.0000, 1.0000, 0.4153, 1.0000, 0.5728, 1.0000, 0.4864, 1.0000], device='cuda:0', requires_grad=True) 0 [7.487590312957764, 6.487588405609131] 1 [0.5284538269042969, 6.354582786560059] 2 [0.7545259594917297, 4.637290954589844] 3 [0.6777597665786743, 3.8250744342803955] 4 [0.3523153066635132, 2.746516466140747] 5 [0.7182425856590271, 3.960019826889038] 6 [0.5057306289672852, 3.0013427734375] 7 [0.7654092311859131, 5.755405426025391] 8 [0.45249107480049133, 1.4073342084884644] 9 [0.4926925301551819, 2.434438943862915] 10 [0.6576120853424072, 2.972611665725708] 11 [0.43753713369369507, 3.0763158798217773] 12 [0.940873384475708, 6.200906753540039] 13 [1.0530884265899658, 3.561375379562378] 14 [0.9686746001243591, 1.7726590633392334] 15 [0.8291715383529663, 0.9093837141990662] 0 [13.968647956848145, 27.10942840576172, 31.518966674804688] 1 [31.05357551574707, 28.607248306274414, 71.00946807861328] 2 [72.57604217529297, 23.836992263793945, 31.391069412231445] 3 [66.10929107666016, 30.80803108215332, 36.71891403198242] 4 [35.68410873413086, 28.005189895629883, 28.684032440185547] 5 [50.884830474853516, 27.120927810668945, 40.11770248413086] 6 [45.45197677612305, 30.539344787597656, 29.42555046081543] 7 [61.93358612060547, 0.0, 46.53020477294922] 8 
[41.186363220214844, 31.881927490234375, 46.95578384399414] 9 [59.597293853759766, 27.612361907958984, 37.71549987792969] 10 [81.40692901611328, 27.51346206665039, 36.40941619873047] 11 [62.46331787109375, 34.08310317993164, 20.744789123535156] 12 [91.71311950683594, 26.20195198059082, 23.055727005004883] 13 [123.90703582763672, 22.032201766967773, 29.524635314941406] 14 [137.2163543701172, 26.535362243652344, 41.43354034423828] 15 [133.1656951904297, 89.02098083496094, 144.53895568847656] step:3626/6710 train_time:818541ms step_avg:225.74ms step:3627/6710 train_time:818772ms step_avg:225.74ms step:3628/6710 train_time:819010ms step_avg:225.75ms step:3629/6710 train_time:819244ms step_avg:225.75ms step:3630/6710 train_time:819481ms step_avg:225.75ms step:3631/6710 train_time:819716ms step_avg:225.75ms step:3632/6710 train_time:819953ms step_avg:225.76ms step:3633/6710 train_time:820185ms step_avg:225.76ms step:3634/6710 train_time:820421ms step_avg:225.76ms step:3635/6710 train_time:820656ms step_avg:225.76ms step:3636/6710 train_time:820889ms step_avg:225.77ms step:3637/6710 train_time:821125ms step_avg:225.77ms step:3638/6710 train_time:821360ms step_avg:225.77ms step:3639/6710 train_time:821595ms step_avg:225.77ms step:3640/6710 train_time:821828ms step_avg:225.78ms step:3641/6710 train_time:822064ms step_avg:225.78ms step:3642/6710 train_time:822302ms step_avg:225.78ms step:3643/6710 train_time:822536ms step_avg:225.79ms step:3644/6710 train_time:822772ms step_avg:225.79ms step:3645/6710 train_time:823006ms step_avg:225.79ms step:3646/6710 train_time:823239ms step_avg:225.79ms step:3647/6710 train_time:823474ms step_avg:225.79ms step:3648/6710 train_time:823709ms step_avg:225.80ms step:3649/6710 train_time:823944ms step_avg:225.80ms step:3650/6710 train_time:824179ms step_avg:225.80ms step:3651/6710 train_time:824414ms step_avg:225.80ms step:3652/6710 train_time:824648ms step_avg:225.81ms step:3653/6710 train_time:824885ms step_avg:225.81ms step:3654/6710 
train_time:825119ms step_avg:225.81ms step:3655/6710 train_time:825356ms step_avg:225.82ms step:3656/6710 train_time:825590ms step_avg:225.82ms step:3657/6710 train_time:825826ms step_avg:225.82ms step:3658/6710 train_time:826061ms step_avg:225.82ms step:3659/6710 train_time:826295ms step_avg:225.83ms step:3660/6710 train_time:826529ms step_avg:225.83ms step:3661/6710 train_time:826764ms step_avg:225.83ms step:3662/6710 train_time:826997ms step_avg:225.83ms step:3663/6710 train_time:827232ms step_avg:225.83ms step:3664/6710 train_time:827467ms step_avg:225.84ms step:3665/6710 train_time:827701ms step_avg:225.84ms step:3666/6710 train_time:827936ms step_avg:225.84ms step:3667/6710 train_time:828169ms step_avg:225.84ms step:3668/6710 train_time:828404ms step_avg:225.85ms step:3669/6710 train_time:828637ms step_avg:225.85ms step:3670/6710 train_time:828871ms step_avg:225.85ms step:3671/6710 train_time:829107ms step_avg:225.85ms step:3672/6710 train_time:829343ms step_avg:225.86ms step:3673/6710 train_time:829578ms step_avg:225.86ms step:3674/6710 train_time:829812ms step_avg:225.86ms step:3675/6710 train_time:830047ms step_avg:225.86ms step:3676/6710 train_time:830281ms step_avg:225.87ms step:3677/6710 train_time:830515ms step_avg:225.87ms step:3678/6710 train_time:830750ms step_avg:225.87ms step:3679/6710 train_time:830983ms step_avg:225.87ms step:3680/6710 train_time:831219ms step_avg:225.87ms step:3681/6710 train_time:831455ms step_avg:225.88ms step:3682/6710 train_time:831690ms step_avg:225.88ms step:3683/6710 train_time:831925ms step_avg:225.88ms step:3684/6710 train_time:832161ms step_avg:225.89ms step:3685/6710 train_time:832394ms step_avg:225.89ms step:3686/6710 train_time:832628ms step_avg:225.89ms step:3687/6710 train_time:832862ms step_avg:225.89ms step:3688/6710 train_time:833096ms step_avg:225.89ms step:3689/6710 train_time:833330ms step_avg:225.90ms step:3690/6710 train_time:833564ms step_avg:225.90ms step:3691/6710 train_time:833799ms step_avg:225.90ms 
step:3692/6710 train_time:834031ms step_avg:225.90ms step:3693/6710 train_time:834268ms step_avg:225.91ms step:3694/6710 train_time:834504ms step_avg:225.91ms step:3695/6710 train_time:834737ms step_avg:225.91ms step:3696/6710 train_time:834971ms step_avg:225.91ms step:3697/6710 train_time:835205ms step_avg:225.91ms step:3698/6710 train_time:835441ms step_avg:225.92ms step:3699/6710 train_time:835675ms step_avg:225.92ms step:3700/6710 train_time:835909ms step_avg:225.92ms step:3701/6710 train_time:836145ms step_avg:225.92ms step:3702/6710 train_time:836380ms step_avg:225.93ms step:3703/6710 train_time:836613ms step_avg:225.93ms step:3704/6710 train_time:836849ms step_avg:225.93ms step:3705/6710 train_time:837085ms step_avg:225.93ms step:3706/6710 train_time:837318ms step_avg:225.94ms step:3707/6710 train_time:837552ms step_avg:225.94ms step:3708/6710 train_time:837787ms step_avg:225.94ms step:3709/6710 train_time:838022ms step_avg:225.94ms step:3710/6710 train_time:838257ms step_avg:225.95ms step:3711/6710 train_time:838492ms step_avg:225.95ms step:3712/6710 train_time:838729ms step_avg:225.95ms step:3713/6710 train_time:838963ms step_avg:225.95ms step:3714/6710 train_time:839197ms step_avg:225.95ms step:3715/6710 train_time:839432ms step_avg:225.96ms step:3716/6710 train_time:839666ms step_avg:225.96ms step:3717/6710 train_time:839901ms step_avg:225.96ms step:3718/6710 train_time:840137ms step_avg:225.96ms step:3719/6710 train_time:840371ms step_avg:225.97ms step:3720/6710 train_time:840606ms step_avg:225.97ms step:3721/6710 train_time:840840ms step_avg:225.97ms step:3722/6710 train_time:841074ms step_avg:225.97ms step:3723/6710 train_time:841308ms step_avg:225.98ms step:3724/6710 train_time:841543ms step_avg:225.98ms step:3725/6710 train_time:841777ms step_avg:225.98ms step:3726/6710 train_time:842011ms step_avg:225.98ms step:3727/6710 train_time:842248ms step_avg:225.99ms step:3728/6710 train_time:842481ms step_avg:225.99ms step:3729/6710 train_time:842717ms 
step_avg:225.99ms step:3730/6710 train_time:842950ms step_avg:225.99ms step:3731/6710 train_time:843186ms step_avg:225.99ms step:3732/6710 train_time:843421ms step_avg:226.00ms step:3733/6710 train_time:843654ms step_avg:226.00ms step:3734/6710 train_time:843889ms step_avg:226.00ms step:3735/6710 train_time:844124ms step_avg:226.00ms step:3736/6710 train_time:844358ms step_avg:226.01ms step:3737/6710 train_time:844593ms step_avg:226.01ms step:3738/6710 train_time:844828ms step_avg:226.01ms step:3739/6710 train_time:845063ms step_avg:226.01ms step:3740/6710 train_time:845297ms step_avg:226.02ms step:3741/6710 train_time:845531ms step_avg:226.02ms step:3742/6710 train_time:845766ms step_avg:226.02ms step:3743/6710 train_time:846000ms step_avg:226.02ms step:3744/6710 train_time:846237ms step_avg:226.02ms step:3745/6710 train_time:846469ms step_avg:226.03ms step:3746/6710 train_time:846705ms step_avg:226.03ms step:3747/6710 train_time:846939ms step_avg:226.03ms step:3748/6710 train_time:847173ms step_avg:226.03ms step:3749/6710 train_time:847408ms step_avg:226.04ms step:3750/6710 train_time:847642ms step_avg:226.04ms step:3750/6710 val_loss:3.102041 train_time:847828ms step_avg:226.09ms Parameter containing: tensor([1.0000, 1.0000, 0.4165, 1.0000, 0.5662, 1.0000, 0.4784, 1.0000], device='cuda:0', requires_grad=True) 0 [7.545287609100342, 6.545285701751709] 1 [0.5235905647277832, 6.369290828704834] 2 [0.7500855922698975, 4.601396083831787] 3 [0.6866392493247986, 3.794356107711792] 4 [0.352576345205307, 2.7291972637176514] 5 [0.7180224657058716, 3.906754732131958] 6 [0.5065188407897949, 2.9370481967926025] 7 [0.7579123377799988, 5.699068069458008] 8 [0.4501979649066925, 1.3185722827911377] 9 [0.48739001154899597, 2.3554930686950684] 10 [0.6544721126556396, 2.924184799194336] 11 [0.43726345896720886, 3.047549247741699] 12 [0.9338579177856445, 6.218005180358887] 13 [1.0457934141159058, 3.538172483444214] 14 [0.9631032347679138, 1.716055989265442] 15 [0.8373539447784424, 
0.8305560350418091] 0 [14.08658504486084, 26.852052688598633, 31.715578079223633] 1 [30.770166397094727, 28.492610931396484, 71.69889831542969] 2 [72.32392120361328, 23.704084396362305, 31.230562210083008] 3 [66.35763549804688, 30.5989990234375, 36.468021392822266] 4 [35.53717803955078, 27.717498779296875, 28.796192169189453] 5 [50.48215866088867, 26.967647552490234, 39.91780090332031] 6 [45.10912322998047, 30.31437110900879, 29.33209228515625] 7 [60.8105354309082, 0.0, 46.07073211669922] 8 [40.35920715332031, 31.56369972229004, 46.77005386352539] 9 [57.94377136230469, 27.229293823242188, 37.430816650390625] 10 [79.24982452392578, 27.516386032104492, 36.33212661743164] 11 [61.3842658996582, 34.01731491088867, 20.845134735107422] 12 [89.95101165771484, 26.33920669555664, 22.965320587158203] 13 [121.25373840332031, 21.724458694458008, 29.04964256286621] 14 [133.74160766601562, 26.072704315185547, 40.560096740722656] 15 [131.2758331298828, 88.07893371582031, 145.3344268798828] step:3751/6710 train_time:847879ms step_avg:226.04ms step:3752/6710 train_time:848110ms step_avg:226.04ms step:3753/6710 train_time:848348ms step_avg:226.05ms step:3754/6710 train_time:848582ms step_avg:226.05ms step:3755/6710 train_time:848819ms step_avg:226.05ms step:3756/6710 train_time:849054ms step_avg:226.05ms step:3757/6710 train_time:849288ms step_avg:226.05ms step:3758/6710 train_time:849523ms step_avg:226.06ms step:3759/6710 train_time:849757ms step_avg:226.06ms step:3760/6710 train_time:849992ms step_avg:226.06ms step:3761/6710 train_time:850227ms step_avg:226.06ms step:3762/6710 train_time:850461ms step_avg:226.07ms step:3763/6710 train_time:850697ms step_avg:226.07ms step:3764/6710 train_time:850931ms step_avg:226.07ms step:3765/6710 train_time:851165ms step_avg:226.07ms step:3766/6710 train_time:851728ms step_avg:226.16ms step:3767/6710 train_time:851980ms step_avg:226.17ms step:3768/6710 train_time:852211ms step_avg:226.17ms step:3769/6710 train_time:852442ms step_avg:226.17ms 
step:3770/6710 train_time:852674ms step_avg:226.17ms step:3771/6710 train_time:852914ms step_avg:226.18ms step:3772/6710 train_time:853151ms step_avg:226.18ms step:3773/6710 train_time:853386ms step_avg:226.18ms step:3774/6710 train_time:853618ms step_avg:226.18ms step:3775/6710 train_time:853852ms step_avg:226.19ms step:3776/6710 train_time:854090ms step_avg:226.19ms step:3777/6710 train_time:854323ms step_avg:226.19ms step:3778/6710 train_time:854557ms step_avg:226.19ms step:3779/6710 train_time:854791ms step_avg:226.19ms step:3780/6710 train_time:855026ms step_avg:226.20ms step:3781/6710 train_time:855260ms step_avg:226.20ms step:3782/6710 train_time:855495ms step_avg:226.20ms step:3783/6710 train_time:855729ms step_avg:226.20ms step:3784/6710 train_time:855963ms step_avg:226.21ms step:3785/6710 train_time:856198ms step_avg:226.21ms step:3786/6710 train_time:856434ms step_avg:226.21ms step:3787/6710 train_time:856668ms step_avg:226.21ms step:3788/6710 train_time:856902ms step_avg:226.21ms step:3789/6710 train_time:857137ms step_avg:226.22ms step:3790/6710 train_time:857372ms step_avg:226.22ms step:3791/6710 train_time:857610ms step_avg:226.22ms step:3792/6710 train_time:857843ms step_avg:226.22ms step:3793/6710 train_time:858078ms step_avg:226.23ms step:3794/6710 train_time:858314ms step_avg:226.23ms step:3795/6710 train_time:858549ms step_avg:226.23ms step:3796/6710 train_time:858781ms step_avg:226.23ms step:3797/6710 train_time:859016ms step_avg:226.24ms step:3798/6710 train_time:859252ms step_avg:226.24ms step:3799/6710 train_time:859486ms step_avg:226.24ms step:3800/6710 train_time:859721ms step_avg:226.24ms step:3801/6710 train_time:859956ms step_avg:226.24ms step:3802/6710 train_time:860192ms step_avg:226.25ms step:3803/6710 train_time:860427ms step_avg:226.25ms step:3804/6710 train_time:860659ms step_avg:226.25ms step:3805/6710 train_time:860893ms step_avg:226.25ms step:3806/6710 train_time:861126ms step_avg:226.25ms step:3807/6710 train_time:861361ms 
step_avg:226.26ms step:3808/6710 train_time:861596ms step_avg:226.26ms step:3809/6710 train_time:861831ms step_avg:226.26ms step:3810/6710 train_time:862067ms step_avg:226.26ms step:3811/6710 train_time:862302ms step_avg:226.27ms step:3812/6710 train_time:862536ms step_avg:226.27ms step:3813/6710 train_time:862771ms step_avg:226.27ms step:3814/6710 train_time:863009ms step_avg:226.27ms step:3815/6710 train_time:863243ms step_avg:226.28ms step:3816/6710 train_time:863478ms step_avg:226.28ms step:3817/6710 train_time:863712ms step_avg:226.28ms step:3818/6710 train_time:863948ms step_avg:226.28ms step:3819/6710 train_time:864181ms step_avg:226.28ms step:3820/6710 train_time:864415ms step_avg:226.29ms step:3821/6710 train_time:864650ms step_avg:226.29ms step:3822/6710 train_time:864885ms step_avg:226.29ms step:3823/6710 train_time:865119ms step_avg:226.29ms step:3824/6710 train_time:865354ms step_avg:226.30ms step:3825/6710 train_time:865589ms step_avg:226.30ms step:3826/6710 train_time:865823ms step_avg:226.30ms step:3827/6710 train_time:866058ms step_avg:226.30ms step:3828/6710 train_time:866292ms step_avg:226.30ms step:3829/6710 train_time:866531ms step_avg:226.31ms step:3830/6710 train_time:866765ms step_avg:226.31ms step:3831/6710 train_time:866999ms step_avg:226.31ms step:3832/6710 train_time:867233ms step_avg:226.31ms step:3833/6710 train_time:867467ms step_avg:226.32ms step:3834/6710 train_time:867701ms step_avg:226.32ms step:3835/6710 train_time:867938ms step_avg:226.32ms step:3836/6710 train_time:868173ms step_avg:226.32ms step:3837/6710 train_time:868409ms step_avg:226.32ms step:3838/6710 train_time:868645ms step_avg:226.33ms step:3839/6710 train_time:868882ms step_avg:226.33ms step:3840/6710 train_time:869121ms step_avg:226.33ms step:3841/6710 train_time:869358ms step_avg:226.34ms step:3842/6710 train_time:869593ms step_avg:226.34ms step:3843/6710 train_time:869830ms step_avg:226.34ms step:3844/6710 train_time:870063ms step_avg:226.34ms step:3845/6710 
train_time:870299ms step_avg:226.35ms step:3846/6710 train_time:870533ms step_avg:226.35ms step:3847/6710 train_time:870768ms step_avg:226.35ms step:3848/6710 train_time:871002ms step_avg:226.35ms step:3849/6710 train_time:871238ms step_avg:226.35ms step:3850/6710 train_time:871472ms step_avg:226.36ms step:3851/6710 train_time:871706ms step_avg:226.36ms step:3852/6710 train_time:871942ms step_avg:226.36ms step:3853/6710 train_time:872180ms step_avg:226.36ms step:3854/6710 train_time:872414ms step_avg:226.37ms step:3855/6710 train_time:872649ms step_avg:226.37ms step:3856/6710 train_time:872886ms step_avg:226.37ms step:3857/6710 train_time:873120ms step_avg:226.37ms step:3858/6710 train_time:873354ms step_avg:226.37ms step:3859/6710 train_time:873592ms step_avg:226.38ms step:3860/6710 train_time:873829ms step_avg:226.38ms step:3861/6710 train_time:874064ms step_avg:226.38ms step:3862/6710 train_time:874299ms step_avg:226.38ms step:3863/6710 train_time:874535ms step_avg:226.39ms step:3864/6710 train_time:874772ms step_avg:226.39ms step:3865/6710 train_time:875004ms step_avg:226.39ms step:3866/6710 train_time:875239ms step_avg:226.39ms step:3867/6710 train_time:875473ms step_avg:226.40ms step:3868/6710 train_time:875709ms step_avg:226.40ms step:3869/6710 train_time:875943ms step_avg:226.40ms step:3870/6710 train_time:876177ms step_avg:226.40ms step:3871/6710 train_time:876413ms step_avg:226.40ms step:3872/6710 train_time:876647ms step_avg:226.41ms step:3873/6710 train_time:876882ms step_avg:226.41ms step:3874/6710 train_time:877117ms step_avg:226.41ms step:3875/6710 train_time:877351ms step_avg:226.41ms step:3875/6710 val_loss:3.093429 train_time:877537ms step_avg:226.46ms Parameter containing: tensor([1.0000, 1.0000, 0.4109, 1.0000, 0.5571, 1.0000, 0.4740, 1.0000], device='cuda:0', requires_grad=True) 0 [7.579920768737793, 6.57991886138916] 1 [0.520490825176239, 6.373043537139893] 2 [0.7386270761489868, 4.554337024688721] 3 [0.6853185296058655, 3.7700719833374023] 4 
[0.3596896827220917, 2.7226271629333496] 5 [0.6996417045593262, 3.862746000289917] 6 [0.5059832334518433, 2.8733911514282227] 7 [0.7594902515411377, 5.652342796325684] 8 [0.4535143971443176, 1.2434419393539429] 9 [0.49364715814590454, 2.2802183628082275] 10 [0.6535590291023254, 2.8736486434936523] 11 [0.43643316626548767, 3.007080554962158] 12 [0.922409176826477, 6.182650566101074] 13 [1.0384668111801147, 3.5072858333587646] 14 [0.962509274482727, 1.6540004014968872] 15 [0.8413163423538208, 0.7249727845191956] 0 [14.157110214233398, 26.71445655822754, 31.927946090698242] 1 [30.635704040527344, 28.297771453857422, 70.36837768554688] 2 [70.22859954833984, 23.54677963256836, 30.8914794921875] 3 [64.82447052001953, 30.328121185302734, 36.605918884277344] 4 [35.74639892578125, 27.538455963134766, 28.88350486755371] 5 [49.27695846557617, 26.9589786529541, 39.20067596435547] 6 [44.21434783935547, 30.101764678955078, 28.91454315185547] 7 [59.922637939453125, 0.0, 45.32584762573242] 8 [40.00190734863281, 31.183401107788086, 46.61444854736328] 9 [57.85112380981445, 27.103633880615234, 37.22749328613281] 10 [78.44393920898438, 27.366024017333984, 36.1861686706543] 11 [60.40944290161133, 33.57851791381836, 20.73008918762207] 12 [87.60714721679688, 26.247499465942383, 22.650144577026367] 13 [117.77364349365234, 21.5335750579834, 28.49675178527832] 14 [130.15774536132812, 25.735864639282227, 39.90911865234375] 15 [128.66839599609375, 87.29358673095703, 142.00753784179688] step:3876/6710 train_time:877588ms step_avg:226.42ms step:3877/6710 train_time:877821ms step_avg:226.42ms step:3878/6710 train_time:878058ms step_avg:226.42ms step:3879/6710 train_time:878290ms step_avg:226.42ms step:3880/6710 train_time:878527ms step_avg:226.42ms step:3881/6710 train_time:878764ms step_avg:226.43ms step:3882/6710 train_time:879000ms step_avg:226.43ms step:3883/6710 train_time:879233ms step_avg:226.43ms step:3884/6710 train_time:879469ms step_avg:226.43ms step:3885/6710 train_time:879705ms 
step_avg:226.44ms step:3886/6710 train_time:879940ms step_avg:226.44ms step:3887/6710 train_time:880174ms step_avg:226.44ms step:3888/6710 train_time:880406ms step_avg:226.44ms step:3889/6710 train_time:880641ms step_avg:226.44ms step:3890/6710 train_time:880876ms step_avg:226.45ms step:3891/6710 train_time:881110ms step_avg:226.45ms step:3892/6710 train_time:881344ms step_avg:226.45ms step:3893/6710 train_time:881577ms step_avg:226.45ms step:3894/6710 train_time:881810ms step_avg:226.45ms step:3895/6710 train_time:882047ms step_avg:226.46ms step:3896/6710 train_time:882282ms step_avg:226.46ms step:3897/6710 train_time:882515ms step_avg:226.46ms step:3898/6710 train_time:882749ms step_avg:226.46ms step:3899/6710 train_time:882985ms step_avg:226.46ms step:3900/6710 train_time:883220ms step_avg:226.47ms step:3901/6710 train_time:883454ms step_avg:226.47ms step:3902/6710 train_time:883689ms step_avg:226.47ms step:3903/6710 train_time:883924ms step_avg:226.47ms step:3904/6710 train_time:884158ms step_avg:226.47ms step:3905/6710 train_time:884392ms step_avg:226.48ms step:3906/6710 train_time:884627ms step_avg:226.48ms step:3907/6710 train_time:884862ms step_avg:226.48ms step:3908/6710 train_time:885098ms step_avg:226.48ms step:3909/6710 train_time:885332ms step_avg:226.49ms step:3910/6710 train_time:885567ms step_avg:226.49ms step:3911/6710 train_time:885802ms step_avg:226.49ms step:3912/6710 train_time:886038ms step_avg:226.49ms step:3913/6710 train_time:886272ms step_avg:226.49ms step:3914/6710 train_time:886507ms step_avg:226.50ms step:3915/6710 train_time:886743ms step_avg:226.50ms step:3916/6710 train_time:886977ms step_avg:226.50ms step:3917/6710 train_time:887215ms step_avg:226.50ms step:3918/6710 train_time:887452ms step_avg:226.51ms step:3919/6710 train_time:887687ms step_avg:226.51ms step:3920/6710 train_time:887923ms step_avg:226.51ms step:3921/6710 train_time:888159ms step_avg:226.51ms step:3922/6710 train_time:888393ms step_avg:226.52ms step:3923/6710 
train_time:888627ms step_avg:226.52ms step:3924/6710 train_time:888863ms step_avg:226.52ms step:3925/6710 train_time:889097ms step_avg:226.52ms step:3926/6710 train_time:889330ms step_avg:226.52ms step:3927/6710 train_time:889564ms step_avg:226.53ms step:3928/6710 train_time:889799ms step_avg:226.53ms step:3929/6710 train_time:890033ms step_avg:226.53ms step:3930/6710 train_time:890268ms step_avg:226.53ms step:3931/6710 train_time:890504ms step_avg:226.53ms step:3932/6710 train_time:890739ms step_avg:226.54ms step:3933/6710 train_time:890974ms step_avg:226.54ms step:3934/6710 train_time:891207ms step_avg:226.54ms step:3935/6710 train_time:891445ms step_avg:226.54ms step:3936/6710 train_time:891680ms step_avg:226.54ms step:3937/6710 train_time:891918ms step_avg:226.55ms step:3938/6710 train_time:892152ms step_avg:226.55ms step:3939/6710 train_time:892386ms step_avg:226.55ms step:3940/6710 train_time:892623ms step_avg:226.55ms step:3941/6710 train_time:892857ms step_avg:226.56ms step:3942/6710 train_time:893094ms step_avg:226.56ms step:3943/6710 train_time:893326ms step_avg:226.56ms step:3944/6710 train_time:893561ms step_avg:226.56ms step:3945/6710 train_time:893794ms step_avg:226.56ms step:3946/6710 train_time:894028ms step_avg:226.57ms step:3947/6710 train_time:894264ms step_avg:226.57ms step:3948/6710 train_time:894499ms step_avg:226.57ms step:3949/6710 train_time:894737ms step_avg:226.57ms step:3950/6710 train_time:894972ms step_avg:226.58ms step:3951/6710 train_time:895206ms step_avg:226.58ms step:3952/6710 train_time:895441ms step_avg:226.58ms step:3953/6710 train_time:895677ms step_avg:226.58ms step:3954/6710 train_time:895914ms step_avg:226.58ms step:3955/6710 train_time:896149ms step_avg:226.59ms step:3956/6710 train_time:896383ms step_avg:226.59ms step:3957/6710 train_time:896617ms step_avg:226.59ms step:3958/6710 train_time:896853ms step_avg:226.59ms step:3959/6710 train_time:897087ms step_avg:226.59ms step:3960/6710 train_time:897321ms step_avg:226.60ms 
step:3961/6710 train_time:897555ms step_avg:226.60ms step:3962/6710 train_time:897789ms step_avg:226.60ms step:3963/6710 train_time:898024ms step_avg:226.60ms step:3964/6710 train_time:898260ms step_avg:226.60ms step:3965/6710 train_time:898492ms step_avg:226.61ms step:3966/6710 train_time:898725ms step_avg:226.61ms step:3967/6710 train_time:898960ms step_avg:226.61ms step:3968/6710 train_time:899195ms step_avg:226.61ms step:3969/6710 train_time:899428ms step_avg:226.61ms step:3970/6710 train_time:899664ms step_avg:226.62ms step:3971/6710 train_time:899897ms step_avg:226.62ms step:3972/6710 train_time:900131ms step_avg:226.62ms step:3973/6710 train_time:900366ms step_avg:226.62ms step:3974/6710 train_time:900601ms step_avg:226.62ms step:3975/6710 train_time:900836ms step_avg:226.63ms step:3976/6710 train_time:901074ms step_avg:226.63ms step:3977/6710 train_time:901307ms step_avg:226.63ms step:3978/6710 train_time:901542ms step_avg:226.63ms step:3979/6710 train_time:901776ms step_avg:226.63ms step:3980/6710 train_time:902012ms step_avg:226.64ms step:3981/6710 train_time:902247ms step_avg:226.64ms step:3982/6710 train_time:902482ms step_avg:226.64ms step:3983/6710 train_time:902716ms step_avg:226.64ms step:3984/6710 train_time:902950ms step_avg:226.64ms step:3985/6710 train_time:903186ms step_avg:226.65ms step:3986/6710 train_time:903422ms step_avg:226.65ms step:3987/6710 train_time:903655ms step_avg:226.65ms step:3988/6710 train_time:903890ms step_avg:226.65ms step:3989/6710 train_time:904125ms step_avg:226.65ms step:3990/6710 train_time:904361ms step_avg:226.66ms step:3991/6710 train_time:904596ms step_avg:226.66ms step:3992/6710 train_time:904830ms step_avg:226.66ms step:3993/6710 train_time:905066ms step_avg:226.66ms step:3994/6710 train_time:905301ms step_avg:226.67ms step:3995/6710 train_time:905536ms step_avg:226.67ms step:3996/6710 train_time:905771ms step_avg:226.67ms step:3997/6710 train_time:906005ms step_avg:226.67ms step:3998/6710 train_time:906240ms 
step_avg:226.67ms step:3999/6710 train_time:906475ms step_avg:226.68ms step:4000/6710 train_time:906709ms step_avg:226.68ms step:4000/6710 val_loss:3.081564 train_time:906898ms step_avg:226.72ms Parameter containing: tensor([1.0000, 1.0000, 0.4143, 1.0000, 0.5550, 1.0000, 0.4598, 1.0000], device='cuda:0', requires_grad=True) 0 [7.598257064819336, 6.598255157470703] 1 [0.5090423226356506, 6.384069442749023] 2 [0.7273722290992737, 4.484886646270752] 3 [0.6932698488235474, 3.7324414253234863] 4 [0.3627432882785797, 2.702643394470215] 5 [0.6873158812522888, 3.7948780059814453] 6 [0.5092489719390869, 2.7917025089263916] 7 [0.7513551712036133, 5.590745449066162] 8 [0.45805028080940247, 1.153021216392517] 9 [0.48390793800354004, 2.2240498065948486] 10 [0.6472908854484558, 2.8175551891326904] 11 [0.4392656683921814, 2.9507639408111572] 12 [0.9162172079086304, 6.1636576652526855] 13 [1.0315985679626465, 3.473520278930664] 14 [0.9580286741256714, 1.5860953330993652] 15 [0.8436176180839539, 0.6274995803833008] 0 [14.1951322555542, 26.419260025024414, 31.697721481323242] 1 [29.89772605895996, 28.0598201751709, 69.84358978271484] 2 [68.27367401123047, 23.106287002563477, 30.534656524658203] 3 [63.91908264160156, 29.894367218017578, 35.89604187011719] 4 [35.44925308227539, 27.171613693237305, 28.817176818847656] 5 [47.98943328857422, 26.602413177490234, 38.68378448486328] 6 [43.541419982910156, 29.815332412719727, 28.798259735107422] 7 [58.54811477661133, 0.0, 44.14603805541992] 8 [39.35334396362305, 30.739267349243164, 45.404457092285156] 9 [55.220882415771484, 26.661373138427734, 36.91489791870117] 10 [75.51065063476562, 27.163808822631836, 35.89515686035156] 11 [59.16328430175781, 33.38521957397461, 20.892475128173828] 12 [85.86266326904297, 26.103906631469727, 22.71653938293457] 13 [115.20796203613281, 21.210268020629883, 28.429338455200195] 14 [127.06330871582031, 25.167612075805664, 39.691802978515625] 15 [126.24959564208984, 85.89765930175781, 140.4779510498047] 
step:4001/6710 train_time:906949ms step_avg:226.68ms step:4002/6710 train_time:907180ms step_avg:226.68ms step:4003/6710 train_time:907421ms step_avg:226.69ms step:4004/6710 train_time:907652ms step_avg:226.69ms step:4005/6710 train_time:907893ms step_avg:226.69ms step:4006/6710 train_time:908129ms step_avg:226.69ms step:4007/6710 train_time:908367ms step_avg:226.70ms step:4008/6710 train_time:908601ms step_avg:226.70ms step:4009/6710 train_time:908835ms step_avg:226.70ms step:4010/6710 train_time:909072ms step_avg:226.70ms step:4011/6710 train_time:909309ms step_avg:226.70ms step:4012/6710 train_time:909546ms step_avg:226.71ms step:4013/6710 train_time:909780ms step_avg:226.71ms step:4014/6710 train_time:910014ms step_avg:226.71ms step:4015/6710 train_time:910250ms step_avg:226.71ms step:4016/6710 train_time:910488ms step_avg:226.72ms step:4017/6710 train_time:910720ms step_avg:226.72ms step:4018/6710 train_time:910955ms step_avg:226.72ms step:4019/6710 train_time:911194ms step_avg:226.72ms step:4020/6710 train_time:911428ms step_avg:226.72ms step:4021/6710 train_time:911664ms step_avg:226.73ms step:4022/6710 train_time:911898ms step_avg:226.73ms step:4023/6710 train_time:912133ms step_avg:226.73ms step:4024/6710 train_time:912372ms step_avg:226.73ms step:4025/6710 train_time:912607ms step_avg:226.73ms step:4026/6710 train_time:912842ms step_avg:226.74ms step:4027/6710 train_time:913076ms step_avg:226.74ms step:4028/6710 train_time:913313ms step_avg:226.74ms step:4029/6710 train_time:913548ms step_avg:226.74ms step:4030/6710 train_time:913782ms step_avg:226.74ms step:4031/6710 train_time:914019ms step_avg:226.75ms step:4032/6710 train_time:914254ms step_avg:226.75ms step:4033/6710 train_time:914490ms step_avg:226.75ms step:4034/6710 train_time:914723ms step_avg:226.75ms step:4035/6710 train_time:914957ms step_avg:226.76ms step:4036/6710 train_time:915194ms step_avg:226.76ms step:4037/6710 train_time:915428ms step_avg:226.76ms step:4038/6710 train_time:915663ms 
step_avg:226.76ms step:4039/6710 train_time:915898ms step_avg:226.76ms step:4040/6710 train_time:916133ms step_avg:226.77ms step:4041/6710 train_time:916367ms step_avg:226.77ms step:4042/6710 train_time:916601ms step_avg:226.77ms step:4043/6710 train_time:916836ms step_avg:226.77ms step:4044/6710 train_time:917071ms step_avg:226.77ms step:4045/6710 train_time:917308ms step_avg:226.78ms step:4046/6710 train_time:917544ms step_avg:226.78ms step:4047/6710 train_time:917780ms step_avg:226.78ms step:4048/6710 train_time:918014ms step_avg:226.78ms step:4049/6710 train_time:918249ms step_avg:226.78ms step:4050/6710 train_time:918484ms step_avg:226.79ms step:4051/6710 train_time:918720ms step_avg:226.79ms step:4052/6710 train_time:918956ms step_avg:226.79ms step:4053/6710 train_time:919190ms step_avg:226.79ms step:4054/6710 train_time:919424ms step_avg:226.79ms step:4055/6710 train_time:919660ms step_avg:226.80ms step:4056/6710 train_time:919894ms step_avg:226.80ms step:4057/6710 train_time:920127ms step_avg:226.80ms step:4058/6710 train_time:920361ms step_avg:226.80ms step:4059/6710 train_time:920594ms step_avg:226.80ms step:4060/6710 train_time:920832ms step_avg:226.81ms step:4061/6710 train_time:921067ms step_avg:226.81ms step:4062/6710 train_time:921302ms step_avg:226.81ms step:4063/6710 train_time:921536ms step_avg:226.81ms step:4064/6710 train_time:921773ms step_avg:226.81ms step:4065/6710 train_time:922009ms step_avg:226.82ms step:4066/6710 train_time:922242ms step_avg:226.82ms step:4067/6710 train_time:922477ms step_avg:226.82ms step:4068/6710 train_time:922713ms step_avg:226.82ms step:4069/6710 train_time:922947ms step_avg:226.82ms step:4070/6710 train_time:923183ms step_avg:226.83ms step:4071/6710 train_time:923419ms step_avg:226.83ms step:4072/6710 train_time:923654ms step_avg:226.83ms step:4073/6710 train_time:923889ms step_avg:226.83ms step:4074/6710 train_time:924124ms step_avg:226.83ms step:4075/6710 train_time:924360ms step_avg:226.84ms step:4076/6710 
train_time:924594ms step_avg:226.84ms step:4077/6710 train_time:924833ms step_avg:226.84ms step:4078/6710 train_time:925068ms step_avg:226.84ms step:4079/6710 train_time:925302ms step_avg:226.85ms step:4080/6710 train_time:925536ms step_avg:226.85ms step:4081/6710 train_time:925774ms step_avg:226.85ms step:4082/6710 train_time:926009ms step_avg:226.85ms step:4083/6710 train_time:926244ms step_avg:226.85ms step:4084/6710 train_time:926480ms step_avg:226.86ms step:4085/6710 train_time:926716ms step_avg:226.86ms step:4086/6710 train_time:926955ms step_avg:226.86ms step:4087/6710 train_time:927192ms step_avg:226.86ms step:4088/6710 train_time:927426ms step_avg:226.87ms step:4089/6710 train_time:927661ms step_avg:226.87ms step:4090/6710 train_time:927897ms step_avg:226.87ms step:4091/6710 train_time:928132ms step_avg:226.87ms step:4092/6710 train_time:928368ms step_avg:226.87ms step:4093/6710 train_time:928602ms step_avg:226.88ms step:4094/6710 train_time:928836ms step_avg:226.88ms step:4095/6710 train_time:929072ms step_avg:226.88ms step:4096/6710 train_time:929309ms step_avg:226.88ms step:4097/6710 train_time:929543ms step_avg:226.88ms step:4098/6710 train_time:929782ms step_avg:226.89ms step:4099/6710 train_time:930016ms step_avg:226.89ms step:4100/6710 train_time:930252ms step_avg:226.89ms step:4101/6710 train_time:930487ms step_avg:226.89ms step:4102/6710 train_time:930725ms step_avg:226.90ms step:4103/6710 train_time:930958ms step_avg:226.90ms step:4104/6710 train_time:931196ms step_avg:226.90ms step:4105/6710 train_time:931433ms step_avg:226.90ms step:4106/6710 train_time:931669ms step_avg:226.90ms step:4107/6710 train_time:931906ms step_avg:226.91ms step:4108/6710 train_time:932141ms step_avg:226.91ms step:4109/6710 train_time:932374ms step_avg:226.91ms step:4110/6710 train_time:932611ms step_avg:226.91ms step:4111/6710 train_time:932845ms step_avg:226.91ms step:4112/6710 train_time:933079ms step_avg:226.92ms step:4113/6710 train_time:933316ms step_avg:226.92ms 
step:4114/6710 train_time:933550ms step_avg:226.92ms step:4115/6710 train_time:933785ms step_avg:226.92ms step:4116/6710 train_time:934022ms step_avg:226.92ms step:4117/6710 train_time:934256ms step_avg:226.93ms step:4118/6710 train_time:934492ms step_avg:226.93ms step:4119/6710 train_time:934728ms step_avg:226.93ms step:4120/6710 train_time:934964ms step_avg:226.93ms step:4121/6710 train_time:935199ms step_avg:226.93ms step:4122/6710 train_time:935434ms step_avg:226.94ms step:4123/6710 train_time:935668ms step_avg:226.94ms step:4124/6710 train_time:935902ms step_avg:226.94ms step:4125/6710 train_time:936136ms step_avg:226.94ms step:4125/6710 val_loss:3.073889 train_time:936322ms step_avg:226.99ms Parameter containing: tensor([1.0000, 1.0000, 0.4082, 1.0000, 0.5486, 1.0000, 0.4648, 1.0000], device='cuda:0', requires_grad=True) 0 [7.617134094238281, 6.617132186889648] 1 [0.5048218965530396, 6.368176460266113] 2 [0.7201352119445801, 4.420363426208496] 3 [0.6833814978599548, 3.680783987045288] 4 [0.36875343322753906, 2.6762821674346924] 5 [0.6861620545387268, 3.725508213043213] 6 [0.5076944231987, 2.719187021255493] 7 [0.7367630004882812, 5.54660177230835] 8 [0.455836683511734, 1.0698201656341553] 9 [0.49064087867736816, 2.1623754501342773] 10 [0.6449736952781677, 2.76489520072937] 11 [0.4397636950016022, 2.9043850898742676] 12 [0.9106221795082092, 6.146800994873047] 13 [1.0218271017074585, 3.4434702396392822] 14 [0.9561921954154968, 1.520625352859497] 15 [0.8488185405731201, 0.5363385081291199] 0 [14.232992172241211, 26.319074630737305, 31.640602111816406] 1 [29.541622161865234, 27.73673439025879, 70.07344055175781] 2 [67.42650604248047, 22.762292861938477, 30.158937454223633] 3 [62.2082405090332, 29.58738136291504, 35.2240104675293] 4 [35.17861557006836, 26.894277572631836, 28.45329475402832] 5 [47.23823928833008, 26.07119369506836, 38.49325180053711] 6 [42.812808990478516, 29.54831314086914, 28.533788681030273] 7 [56.68492126464844, 0.0, 43.24335861206055] 8 
[38.11907958984375, 30.374025344848633, 45.116294860839844] 9 [55.06160354614258, 26.56278419494629, 36.09403610229492] 10 [74.1763687133789, 26.979429244995117, 35.15850830078125] 11 [58.10601806640625, 33.0451545715332, 20.42378807067871] 12 [83.93035888671875, 25.98316764831543, 22.281227111816406] 13 [111.93177032470703, 20.81293487548828, 27.511625289916992] 14 [123.15161895751953, 24.598012924194336, 38.63654327392578] 15 [123.0665283203125, 84.80131530761719, 135.82167053222656] step:4126/6710 train_time:936373ms step_avg:226.94ms step:4127/6710 train_time:936607ms step_avg:226.95ms step:4128/6710 train_time:936846ms step_avg:226.95ms step:4129/6710 train_time:937079ms step_avg:226.95ms step:4130/6710 train_time:937317ms step_avg:226.95ms step:4131/6710 train_time:937551ms step_avg:226.95ms step:4132/6710 train_time:937787ms step_avg:226.96ms step:4133/6710 train_time:938020ms step_avg:226.96ms step:4134/6710 train_time:938257ms step_avg:226.96ms step:4135/6710 train_time:938492ms step_avg:226.96ms step:4136/6710 train_time:938731ms step_avg:226.97ms step:4137/6710 train_time:938965ms step_avg:226.97ms step:4138/6710 train_time:939199ms step_avg:226.97ms step:4139/6710 train_time:939434ms step_avg:226.97ms step:4140/6710 train_time:939671ms step_avg:226.97ms step:4141/6710 train_time:939908ms step_avg:226.98ms step:4142/6710 train_time:940141ms step_avg:226.98ms step:4143/6710 train_time:940375ms step_avg:226.98ms step:4144/6710 train_time:940610ms step_avg:226.98ms step:4145/6710 train_time:940846ms step_avg:226.98ms step:4146/6710 train_time:941082ms step_avg:226.99ms step:4147/6710 train_time:941315ms step_avg:226.99ms step:4148/6710 train_time:941550ms step_avg:226.99ms step:4149/6710 train_time:941789ms step_avg:226.99ms step:4150/6710 train_time:942023ms step_avg:226.99ms step:4151/6710 train_time:942257ms step_avg:227.00ms step:4152/6710 train_time:942494ms step_avg:227.00ms step:4153/6710 train_time:942726ms step_avg:227.00ms step:4154/6710 
train_time:942959ms step_avg:227.00ms step:4155/6710 train_time:943193ms step_avg:227.00ms step:4156/6710 train_time:943433ms step_avg:227.01ms step:4157/6710 train_time:943671ms step_avg:227.01ms step:4158/6710 train_time:943905ms step_avg:227.01ms step:4159/6710 train_time:944141ms step_avg:227.01ms step:4160/6710 train_time:944376ms step_avg:227.01ms step:4161/6710 train_time:944613ms step_avg:227.02ms step:4162/6710 train_time:944850ms step_avg:227.02ms step:4163/6710 train_time:945087ms step_avg:227.02ms step:4164/6710 train_time:945323ms step_avg:227.02ms step:4165/6710 train_time:945556ms step_avg:227.02ms step:4166/6710 train_time:945794ms step_avg:227.03ms step:4167/6710 train_time:946029ms step_avg:227.03ms step:4168/6710 train_time:946263ms step_avg:227.03ms step:4169/6710 train_time:946498ms step_avg:227.03ms step:4170/6710 train_time:946734ms step_avg:227.03ms step:4171/6710 train_time:946970ms step_avg:227.04ms step:4172/6710 train_time:947205ms step_avg:227.04ms step:4173/6710 train_time:947440ms step_avg:227.04ms step:4174/6710 train_time:947676ms step_avg:227.04ms step:4175/6710 train_time:947911ms step_avg:227.04ms step:4176/6710 train_time:948147ms step_avg:227.05ms step:4177/6710 train_time:948385ms step_avg:227.05ms step:4178/6710 train_time:948621ms step_avg:227.05ms step:4179/6710 train_time:948854ms step_avg:227.05ms step:4180/6710 train_time:949089ms step_avg:227.05ms step:4181/6710 train_time:949325ms step_avg:227.06ms step:4182/6710 train_time:949563ms step_avg:227.06ms step:4183/6710 train_time:949796ms step_avg:227.06ms step:4184/6710 train_time:950028ms step_avg:227.06ms step:4185/6710 train_time:950265ms step_avg:227.06ms step:4186/6710 train_time:950499ms step_avg:227.07ms step:4187/6710 train_time:950734ms step_avg:227.07ms step:4188/6710 train_time:950969ms step_avg:227.07ms step:4189/6710 train_time:951204ms step_avg:227.07ms step:4190/6710 train_time:951441ms step_avg:227.07ms step:4191/6710 train_time:951679ms step_avg:227.08ms 
step:4192/6710 train_time:951913ms step_avg:227.08ms step:4193/6710 train_time:952146ms step_avg:227.08ms step:4194/6710 train_time:952380ms step_avg:227.08ms step:4195/6710 train_time:952615ms step_avg:227.08ms step:4196/6710 train_time:952849ms step_avg:227.08ms step:4197/6710 train_time:953085ms step_avg:227.09ms step:4198/6710 train_time:953320ms step_avg:227.09ms step:4199/6710 train_time:953558ms step_avg:227.09ms step:4200/6710 train_time:953793ms step_avg:227.09ms step:4201/6710 train_time:954028ms step_avg:227.10ms step:4202/6710 train_time:954263ms step_avg:227.10ms step:4203/6710 train_time:954497ms step_avg:227.10ms step:4204/6710 train_time:954732ms step_avg:227.10ms step:4205/6710 train_time:954968ms step_avg:227.10ms step:4206/6710 train_time:955203ms step_avg:227.10ms step:4207/6710 train_time:955436ms step_avg:227.11ms step:4208/6710 train_time:955670ms step_avg:227.11ms step:4209/6710 train_time:955905ms step_avg:227.11ms step:4210/6710 train_time:956137ms step_avg:227.11ms step:4211/6710 train_time:956372ms step_avg:227.11ms step:4212/6710 train_time:956611ms step_avg:227.12ms step:4213/6710 train_time:956847ms step_avg:227.12ms step:4214/6710 train_time:957082ms step_avg:227.12ms step:4215/6710 train_time:957317ms step_avg:227.12ms step:4216/6710 train_time:957553ms step_avg:227.12ms step:4217/6710 train_time:957786ms step_avg:227.12ms step:4218/6710 train_time:958021ms step_avg:227.13ms step:4219/6710 train_time:958255ms step_avg:227.13ms step:4220/6710 train_time:958491ms step_avg:227.13ms step:4221/6710 train_time:958726ms step_avg:227.13ms step:4222/6710 train_time:958960ms step_avg:227.13ms step:4223/6710 train_time:959197ms step_avg:227.14ms step:4224/6710 train_time:959432ms step_avg:227.14ms step:4225/6710 train_time:959669ms step_avg:227.14ms step:4226/6710 train_time:959901ms step_avg:227.14ms step:4227/6710 train_time:960136ms step_avg:227.14ms step:4228/6710 train_time:960372ms step_avg:227.15ms step:4229/6710 train_time:960608ms 
step_avg:227.15ms step:4230/6710 train_time:960841ms step_avg:227.15ms step:4231/6710 train_time:961074ms step_avg:227.15ms step:4232/6710 train_time:961308ms step_avg:227.15ms step:4233/6710 train_time:961545ms step_avg:227.15ms step:4234/6710 train_time:961779ms step_avg:227.16ms step:4235/6710 train_time:962013ms step_avg:227.16ms step:4236/6710 train_time:962247ms step_avg:227.16ms step:4237/6710 train_time:962481ms step_avg:227.16ms step:4238/6710 train_time:962715ms step_avg:227.16ms step:4239/6710 train_time:962951ms step_avg:227.16ms step:4240/6710 train_time:963187ms step_avg:227.17ms step:4241/6710 train_time:963423ms step_avg:227.17ms step:4242/6710 train_time:963656ms step_avg:227.17ms step:4243/6710 train_time:963890ms step_avg:227.17ms step:4244/6710 train_time:964126ms step_avg:227.17ms step:4245/6710 train_time:964361ms step_avg:227.18ms step:4246/6710 train_time:964597ms step_avg:227.18ms step:4247/6710 train_time:964833ms step_avg:227.18ms step:4248/6710 train_time:965069ms step_avg:227.18ms step:4249/6710 train_time:965306ms step_avg:227.18ms step:4250/6710 train_time:965540ms step_avg:227.19ms step:4250/6710 val_loss:3.065591 train_time:965723ms step_avg:227.23ms Parameter containing: tensor([1.0000, 1.0000, 0.4108, 1.0000, 0.5358, 1.0000, 0.4531, 1.0000], device='cuda:0', requires_grad=True) 0 [7.614380359649658, 6.614378452301025] 1 [0.5021954774856567, 6.332128047943115] 2 [0.7139480113983154, 4.340001583099365] 3 [0.6851356625556946, 3.619023323059082] 4 [0.367078959941864, 2.6368391513824463] 5 [0.671951174736023, 3.6373965740203857] 6 [0.5117736458778381, 2.6354565620422363] 7 [0.7324987649917603, 5.484143257141113] 8 [0.4699101746082306, 1.003973126411438] 9 [0.48891082406044006, 2.109588384628296] 10 [0.6438053846359253, 2.715550661087036] 11 [0.44255727529525757, 2.8361093997955322] 12 [0.9084824323654175, 6.088963508605957] 13 [1.0170084238052368, 3.3798279762268066] 14 [0.9571444392204285, 1.4378496408462524] 15 [0.8528643250465393, 
0.4527212977409363] 0 [14.228697776794434, 25.901437759399414, 31.28289222717285] 1 [29.074825286865234, 27.44644546508789, 69.49911499023438] 2 [66.09345245361328, 22.35213851928711, 29.692895889282227] 3 [61.16435241699219, 29.18581771850586, 34.663211822509766] 4 [34.47438049316406, 26.4968204498291, 28.69540023803711] 5 [45.78367614746094, 25.767135620117188, 38.04091262817383] 6 [42.17700958251953, 29.05585479736328, 28.058372497558594] 7 [55.342166900634766, 0.0, 42.74860763549805] 8 [38.48783874511719, 29.84877586364746, 44.94474792480469] 9 [54.17729568481445, 26.031051635742188, 35.95252227783203] 10 [72.56304931640625, 26.414278030395508, 35.050682067871094] 11 [57.38196563720703, 32.504852294921875, 20.61395835876465] 12 [82.69083404541016, 25.739334106445312, 22.30390739440918] 13 [109.90950012207031, 20.014192581176758, 27.250656127929688] 14 [121.10646057128906, 24.114208221435547, 37.94306182861328] 15 [121.6399154663086, 83.0465087890625, 135.946044921875] step:4251/6710 train_time:965775ms step_avg:227.19ms step:4252/6710 train_time:966006ms step_avg:227.19ms step:4253/6710 train_time:966246ms step_avg:227.19ms step:4254/6710 train_time:966479ms step_avg:227.19ms step:4255/6710 train_time:966718ms step_avg:227.20ms step:4256/6710 train_time:966953ms step_avg:227.20ms step:4257/6710 train_time:967189ms step_avg:227.20ms step:4258/6710 train_time:967423ms step_avg:227.20ms step:4259/6710 train_time:967658ms step_avg:227.20ms step:4260/6710 train_time:967895ms step_avg:227.21ms step:4261/6710 train_time:968130ms step_avg:227.21ms step:4262/6710 train_time:968364ms step_avg:227.21ms step:4263/6710 train_time:968599ms step_avg:227.21ms step:4264/6710 train_time:968835ms step_avg:227.21ms step:4265/6710 train_time:969071ms step_avg:227.21ms step:4266/6710 train_time:969306ms step_avg:227.22ms step:4267/6710 train_time:969539ms step_avg:227.22ms step:4268/6710 train_time:969775ms step_avg:227.22ms step:4269/6710 train_time:970010ms step_avg:227.22ms 
step:4270/6710 train_time:970247ms step_avg:227.22ms step:4271/6710 train_time:970480ms step_avg:227.23ms step:4272/6710 train_time:970718ms step_avg:227.23ms step:4273/6710 train_time:970953ms step_avg:227.23ms step:4274/6710 train_time:971193ms step_avg:227.23ms step:4275/6710 train_time:971427ms step_avg:227.23ms step:4276/6710 train_time:971662ms step_avg:227.24ms step:4277/6710 train_time:971896ms step_avg:227.24ms step:4278/6710 train_time:972132ms step_avg:227.24ms step:4279/6710 train_time:972367ms step_avg:227.24ms step:4280/6710 train_time:972601ms step_avg:227.24ms step:4281/6710 train_time:972836ms step_avg:227.24ms step:4282/6710 train_time:973071ms step_avg:227.25ms step:4283/6710 train_time:973307ms step_avg:227.25ms step:4284/6710 train_time:973541ms step_avg:227.25ms step:4285/6710 train_time:973775ms step_avg:227.25ms step:4286/6710 train_time:974009ms step_avg:227.25ms step:4287/6710 train_time:974245ms step_avg:227.26ms step:4288/6710 train_time:974480ms step_avg:227.26ms step:4289/6710 train_time:974714ms step_avg:227.26ms step:4290/6710 train_time:974951ms step_avg:227.26ms step:4291/6710 train_time:975186ms step_avg:227.26ms step:4292/6710 train_time:975420ms step_avg:227.26ms step:4293/6710 train_time:975655ms step_avg:227.27ms step:4294/6710 train_time:975890ms step_avg:227.27ms step:4295/6710 train_time:976125ms step_avg:227.27ms step:4296/6710 train_time:976358ms step_avg:227.27ms step:4297/6710 train_time:976594ms step_avg:227.27ms step:4298/6710 train_time:976830ms step_avg:227.28ms step:4299/6710 train_time:977064ms step_avg:227.28ms step:4300/6710 train_time:977297ms step_avg:227.28ms step:4301/6710 train_time:977533ms step_avg:227.28ms step:4302/6710 train_time:977769ms step_avg:227.28ms step:4303/6710 train_time:978002ms step_avg:227.28ms step:4304/6710 train_time:978237ms step_avg:227.29ms step:4305/6710 train_time:978474ms step_avg:227.29ms step:4306/6710 train_time:978708ms step_avg:227.29ms step:4307/6710 train_time:978942ms 
step_avg:227.29ms step:4308/6710 train_time:979178ms step_avg:227.29ms step:4309/6710 train_time:979415ms step_avg:227.30ms step:4310/6710 train_time:979650ms step_avg:227.30ms step:4311/6710 train_time:979885ms step_avg:227.30ms step:4312/6710 train_time:980121ms step_avg:227.30ms step:4313/6710 train_time:980357ms step_avg:227.30ms step:4314/6710 train_time:980591ms step_avg:227.30ms step:4315/6710 train_time:980826ms step_avg:227.31ms step:4316/6710 train_time:981059ms step_avg:227.31ms step:4317/6710 train_time:981294ms step_avg:227.31ms step:4318/6710 train_time:981529ms step_avg:227.31ms step:4319/6710 train_time:981762ms step_avg:227.31ms step:4320/6710 train_time:981996ms step_avg:227.31ms step:4321/6710 train_time:982231ms step_avg:227.32ms step:4322/6710 train_time:982468ms step_avg:227.32ms step:4323/6710 train_time:982705ms step_avg:227.32ms step:4324/6710 train_time:982941ms step_avg:227.32ms step:4325/6710 train_time:983178ms step_avg:227.32ms step:4326/6710 train_time:983413ms step_avg:227.33ms step:4327/6710 train_time:983648ms step_avg:227.33ms step:4328/6710 train_time:983884ms step_avg:227.33ms step:4329/6710 train_time:984117ms step_avg:227.33ms step:4330/6710 train_time:984353ms step_avg:227.33ms step:4331/6710 train_time:984588ms step_avg:227.34ms step:4332/6710 train_time:984823ms step_avg:227.34ms step:4333/6710 train_time:985058ms step_avg:227.34ms step:4334/6710 train_time:985293ms step_avg:227.34ms step:4335/6710 train_time:985527ms step_avg:227.34ms step:4336/6710 train_time:985760ms step_avg:227.34ms step:4337/6710 train_time:985998ms step_avg:227.35ms step:4338/6710 train_time:986233ms step_avg:227.35ms step:4339/6710 train_time:986468ms step_avg:227.35ms step:4340/6710 train_time:986704ms step_avg:227.35ms step:4341/6710 train_time:986939ms step_avg:227.35ms step:4342/6710 train_time:987174ms step_avg:227.35ms step:4343/6710 train_time:987409ms step_avg:227.36ms step:4344/6710 train_time:987644ms step_avg:227.36ms step:4345/6710 
train_time:987877ms step_avg:227.36ms step:4346/6710 train_time:988112ms step_avg:227.36ms step:4347/6710 train_time:988349ms step_avg:227.36ms step:4348/6710 train_time:988583ms step_avg:227.37ms step:4349/6710 train_time:988818ms step_avg:227.37ms step:4350/6710 train_time:989055ms step_avg:227.37ms step:4351/6710 train_time:989290ms step_avg:227.37ms step:4352/6710 train_time:989524ms step_avg:227.37ms step:4353/6710 train_time:989758ms step_avg:227.37ms step:4354/6710 train_time:989995ms step_avg:227.38ms step:4355/6710 train_time:990231ms step_avg:227.38ms step:4356/6710 train_time:990468ms step_avg:227.38ms step:4357/6710 train_time:990703ms step_avg:227.38ms step:4358/6710 train_time:990939ms step_avg:227.38ms step:4359/6710 train_time:991174ms step_avg:227.39ms step:4360/6710 train_time:991410ms step_avg:227.39ms step:4361/6710 train_time:991645ms step_avg:227.39ms step:4362/6710 train_time:991879ms step_avg:227.39ms step:4363/6710 train_time:992117ms step_avg:227.39ms step:4364/6710 train_time:992352ms step_avg:227.40ms step:4365/6710 train_time:992586ms step_avg:227.40ms step:4366/6710 train_time:992821ms step_avg:227.40ms step:4367/6710 train_time:993059ms step_avg:227.40ms step:4368/6710 train_time:993294ms step_avg:227.40ms step:4369/6710 train_time:993530ms step_avg:227.40ms step:4370/6710 train_time:993765ms step_avg:227.41ms step:4371/6710 train_time:993999ms step_avg:227.41ms step:4372/6710 train_time:994234ms step_avg:227.41ms step:4373/6710 train_time:994469ms step_avg:227.41ms step:4374/6710 train_time:994706ms step_avg:227.41ms step:4375/6710 train_time:994941ms step_avg:227.42ms step:4375/6710 val_loss:3.057427 train_time:995129ms step_avg:227.46ms Parameter containing: tensor([1.0000, 1.0000, 0.4083, 1.0000, 0.5350, 1.0000, 0.4432, 1.0000], device='cuda:0', requires_grad=True) 0 [7.61710262298584, 6.617100715637207] 1 [0.4996947944164276, 6.278346061706543] 2 [0.7026287317276001, 4.232677936553955] 3 [0.6877167224884033, 3.552027702331543] 4 
[0.37841856479644775, 2.590574026107788] 5 [0.6746205687522888, 3.567650318145752] 6 [0.5072221159934998, 2.541719913482666] 7 [0.722083330154419, 5.38456392288208] 8 [0.462380051612854, 0.8968574404716492] 9 [0.49003148078918457, 2.02406644821167] 10 [0.6377328038215637, 2.642059564590454] 11 [0.44090282917022705, 2.761890411376953] 12 [0.9017164707183838, 6.057564735412598] 13 [1.0060312747955322, 3.3593428134918213] 14 [0.9548230171203613, 1.384568214416504] 15 [0.856067419052124, 0.36812084913253784] 0 [14.23354721069336, 25.354339599609375, 30.950206756591797] 1 [28.607574462890625, 27.192575454711914, 67.16651916503906] 2 [63.33723831176758, 21.928789138793945, 29.237356185913086] 3 [59.352943420410156, 28.710176467895508, 33.71985626220703] 4 [34.564144134521484, 26.172754287719727, 28.37661361694336] 5 [45.58656311035156, 25.259660720825195, 37.4232063293457] 6 [41.343379974365234, 28.715229034423828, 27.83082389831543] 7 [53.70538330078125, 0.0, 41.746768951416016] 8 [36.885929107666016, 29.265016555786133, 43.94486999511719] 9 [52.537113189697266, 25.61316680908203, 35.41073989868164] 10 [70.2943344116211, 26.23868751525879, 34.49726867675781] 11 [55.626312255859375, 32.05971145629883, 20.37080192565918] 12 [80.21626281738281, 25.494272232055664, 21.82773208618164] 13 [105.90403747558594, 19.84889030456543, 26.665714263916016] 14 [116.81566619873047, 23.760963439941406, 36.784996032714844] 15 [118.23936462402344, 80.9956283569336, 133.24082946777344] step:4376/6710 train_time:995179ms step_avg:227.42ms step:4377/6710 train_time:995412ms step_avg:227.42ms step:4378/6710 train_time:995651ms step_avg:227.42ms step:4379/6710 train_time:995886ms step_avg:227.42ms step:4380/6710 train_time:996123ms step_avg:227.43ms step:4381/6710 train_time:996360ms step_avg:227.43ms step:4382/6710 train_time:996598ms step_avg:227.43ms step:4383/6710 train_time:996833ms step_avg:227.43ms step:4384/6710 train_time:997068ms step_avg:227.43ms step:4385/6710 train_time:997303ms 
step_avg:227.44ms step:4386/6710 train_time:997541ms step_avg:227.44ms step:4387/6710 train_time:997775ms step_avg:227.44ms step:4388/6710 train_time:998009ms step_avg:227.44ms step:4389/6710 train_time:998244ms step_avg:227.44ms step:4390/6710 train_time:998480ms step_avg:227.44ms step:4391/6710 train_time:998714ms step_avg:227.45ms step:4392/6710 train_time:998949ms step_avg:227.45ms step:4393/6710 train_time:999182ms step_avg:227.45ms step:4394/6710 train_time:999420ms step_avg:227.45ms step:4395/6710 train_time:999655ms step_avg:227.45ms step:4396/6710 train_time:999889ms step_avg:227.45ms step:4397/6710 train_time:1000124ms step_avg:227.46ms step:4398/6710 train_time:1000362ms step_avg:227.46ms step:4399/6710 train_time:1000596ms step_avg:227.46ms step:4400/6710 train_time:1000832ms step_avg:227.46ms step:4401/6710 train_time:1001067ms step_avg:227.46ms step:4402/6710 train_time:1001304ms step_avg:227.47ms step:4403/6710 train_time:1001540ms step_avg:227.47ms step:4404/6710 train_time:1001775ms step_avg:227.47ms step:4405/6710 train_time:1002010ms step_avg:227.47ms step:4406/6710 train_time:1002246ms step_avg:227.47ms step:4407/6710 train_time:1002482ms step_avg:227.47ms step:4408/6710 train_time:1002717ms step_avg:227.48ms step:4409/6710 train_time:1002952ms step_avg:227.48ms step:4410/6710 train_time:1003186ms step_avg:227.48ms step:4411/6710 train_time:1003421ms step_avg:227.48ms step:4412/6710 train_time:1003658ms step_avg:227.48ms step:4413/6710 train_time:1003892ms step_avg:227.49ms step:4414/6710 train_time:1004126ms step_avg:227.49ms step:4415/6710 train_time:1004361ms step_avg:227.49ms step:4416/6710 train_time:1004596ms step_avg:227.49ms step:4417/6710 train_time:1004830ms step_avg:227.49ms step:4418/6710 train_time:1005066ms step_avg:227.49ms step:4419/6710 train_time:1005301ms step_avg:227.50ms step:4420/6710 train_time:1005536ms step_avg:227.50ms step:4421/6710 train_time:1005769ms step_avg:227.50ms step:4422/6710 train_time:1006005ms 
step_avg:227.50ms step:4423/6710 train_time:1006239ms step_avg:227.50ms step:4424/6710 train_time:1006474ms step_avg:227.50ms step:4425/6710 train_time:1006708ms step_avg:227.50ms step:4426/6710 train_time:1006944ms step_avg:227.51ms step:4427/6710 train_time:1007178ms step_avg:227.51ms step:4428/6710 train_time:1007412ms step_avg:227.51ms step:4429/6710 train_time:1007649ms step_avg:227.51ms step:4430/6710 train_time:1007884ms step_avg:227.51ms step:4431/6710 train_time:1008120ms step_avg:227.52ms step:4432/6710 train_time:1008354ms step_avg:227.52ms step:4433/6710 train_time:1008588ms step_avg:227.52ms step:4434/6710 train_time:1008824ms step_avg:227.52ms step:4435/6710 train_time:1009060ms step_avg:227.52ms step:4436/6710 train_time:1009295ms step_avg:227.52ms step:4437/6710 train_time:1009532ms step_avg:227.53ms step:4438/6710 train_time:1009771ms step_avg:227.53ms step:4439/6710 train_time:1010006ms step_avg:227.53ms step:4440/6710 train_time:1010241ms step_avg:227.53ms step:4441/6710 train_time:1010476ms step_avg:227.53ms step:4442/6710 train_time:1010710ms step_avg:227.53ms step:4443/6710 train_time:1010945ms step_avg:227.54ms step:4444/6710 train_time:1011180ms step_avg:227.54ms step:4445/6710 train_time:1011413ms step_avg:227.54ms step:4446/6710 train_time:1011648ms step_avg:227.54ms step:4447/6710 train_time:1011882ms step_avg:227.54ms step:4448/6710 train_time:1012119ms step_avg:227.54ms step:4449/6710 train_time:1012352ms step_avg:227.55ms step:4450/6710 train_time:1012587ms step_avg:227.55ms step:4451/6710 train_time:1012823ms step_avg:227.55ms step:4452/6710 train_time:1013058ms step_avg:227.55ms step:4453/6710 train_time:1013293ms step_avg:227.55ms step:4454/6710 train_time:1013527ms step_avg:227.55ms step:4455/6710 train_time:1013762ms step_avg:227.56ms step:4456/6710 train_time:1013999ms step_avg:227.56ms step:4457/6710 train_time:1014234ms step_avg:227.56ms step:4458/6710 train_time:1014473ms step_avg:227.56ms step:4459/6710 train_time:1014707ms 
step_avg:227.56ms step:4460/6710 train_time:1014944ms step_avg:227.57ms step:4461/6710 train_time:1015182ms step_avg:227.57ms step:4462/6710 train_time:1015418ms step_avg:227.57ms step:4463/6710 train_time:1015652ms step_avg:227.57ms step:4464/6710 train_time:1015886ms step_avg:227.57ms step:4465/6710 train_time:1016121ms step_avg:227.57ms step:4466/6710 train_time:1016358ms step_avg:227.58ms step:4467/6710 train_time:1016594ms step_avg:227.58ms step:4468/6710 train_time:1016828ms step_avg:227.58ms step:4469/6710 train_time:1017063ms step_avg:227.58ms step:4470/6710 train_time:1017299ms step_avg:227.58ms step:4471/6710 train_time:1017534ms step_avg:227.59ms step:4472/6710 train_time:1017773ms step_avg:227.59ms step:4473/6710 train_time:1018007ms step_avg:227.59ms step:4474/6710 train_time:1018244ms step_avg:227.59ms step:4475/6710 train_time:1018480ms step_avg:227.59ms step:4476/6710 train_time:1018718ms step_avg:227.60ms step:4477/6710 train_time:1018952ms step_avg:227.60ms step:4478/6710 train_time:1019189ms step_avg:227.60ms step:4479/6710 train_time:1019427ms step_avg:227.60ms step:4480/6710 train_time:1019669ms step_avg:227.60ms step:4481/6710 train_time:1019906ms step_avg:227.61ms step:4482/6710 train_time:1020144ms step_avg:227.61ms step:4483/6710 train_time:1020382ms step_avg:227.61ms step:4484/6710 train_time:1020620ms step_avg:227.61ms step:4485/6710 train_time:1020863ms step_avg:227.62ms step:4486/6710 train_time:1021103ms step_avg:227.62ms step:4487/6710 train_time:1021341ms step_avg:227.62ms step:4488/6710 train_time:1021582ms step_avg:227.63ms step:4489/6710 train_time:1021820ms step_avg:227.63ms step:4490/6710 train_time:1022058ms step_avg:227.63ms step:4491/6710 train_time:1022298ms step_avg:227.63ms step:4492/6710 train_time:1022535ms step_avg:227.63ms step:4493/6710 train_time:1022772ms step_avg:227.64ms step:4494/6710 train_time:1023011ms step_avg:227.64ms step:4495/6710 train_time:1023249ms step_avg:227.64ms step:4496/6710 train_time:1023490ms 
step_avg:227.64ms step:4497/6710 train_time:1023728ms step_avg:227.65ms step:4498/6710 train_time:1023966ms step_avg:227.65ms step:4499/6710 train_time:1024204ms step_avg:227.65ms step:4500/6710 train_time:1024444ms step_avg:227.65ms step:4500/6710 val_loss:3.048243 train_time:1024635ms step_avg:227.70ms Parameter containing: tensor([1.0000, 1.0000, 0.4062, 1.0000, 0.5265, 1.0000, 0.4391, 1.0000], device='cuda:0', requires_grad=True) 0 [7.573484420776367, 6.573482513427734] 1 [0.5018653869628906, 6.194102764129639] 2 [0.6960029602050781, 4.121349811553955] 3 [0.6878643035888672, 3.443119525909424] 4 [0.3769089877605438, 2.516350746154785] 5 [0.6583217978477478, 3.444605588912964] 6 [0.5095053911209106, 2.4533636569976807] 7 [0.7259436845779419, 5.292384624481201] 8 [0.46582886576652527, 0.8026676177978516] 9 [0.4865780770778656, 1.9634754657745361] 10 [0.6385987401008606, 2.578284740447998] 11 [0.4466840922832489, 2.690459966659546] 12 [0.8985665440559387, 5.983011722564697] 13 [1.0021554231643677, 3.295344114303589] 14 [0.9486892223358154, 1.2921538352966309] 15 [0.8638014793395996, 0.26729199290275574] 0 [14.148778915405273, 25.047941207885742, 31.087793350219727] 1 [28.504304885864258, 26.63751220703125, 68.16253662109375] 2 [63.08481979370117, 21.29092025756836, 28.42336082458496] 3 [58.539390563964844, 27.792200088500977, 33.411705017089844] 4 [33.81877899169922, 25.662729263305664, 28.110057830810547] 5 [43.70924377441406, 24.831666946411133, 36.58344268798828] 6 [40.18246841430664, 28.06322479248047, 27.3726749420166] 7 [52.591243743896484, 0.0, 40.600685119628906] 8 [36.207637786865234, 28.591094970703125, 42.72610855102539] 9 [50.76636505126953, 24.92730712890625, 34.5374641418457] 10 [68.0647201538086, 25.740140914916992, 33.58879470825195] 11 [54.68410110473633, 31.47241973876953, 20.159893035888672] 12 [78.53510284423828, 25.199016571044922, 21.610797882080078] 13 [103.53269958496094, 19.352848052978516, 25.954605102539062] 14 [113.4186782836914, 
23.02685546875, 35.66869354248047] 15 [115.66864776611328, 79.32354736328125, 132.74073791503906] step:4501/6710 train_time:1024686ms step_avg:227.66ms step:4502/6710 train_time:1024921ms step_avg:227.66ms step:4503/6710 train_time:1025160ms step_avg:227.66ms step:4504/6710 train_time:1025397ms step_avg:227.66ms step:4505/6710 train_time:1025637ms step_avg:227.67ms step:4506/6710 train_time:1025875ms step_avg:227.67ms step:4507/6710 train_time:1026113ms step_avg:227.67ms step:4508/6710 train_time:1026352ms step_avg:227.67ms step:4509/6710 train_time:1026588ms step_avg:227.68ms step:4510/6710 train_time:1026825ms step_avg:227.68ms step:4511/6710 train_time:1027061ms step_avg:227.68ms step:4512/6710 train_time:1027297ms step_avg:227.68ms step:4513/6710 train_time:1027535ms step_avg:227.68ms step:4514/6710 train_time:1027772ms step_avg:227.69ms step:4515/6710 train_time:1028011ms step_avg:227.69ms step:4516/6710 train_time:1028250ms step_avg:227.69ms step:4517/6710 train_time:1028488ms step_avg:227.69ms step:4518/6710 train_time:1028723ms step_avg:227.69ms step:4519/6710 train_time:1028959ms step_avg:227.70ms step:4520/6710 train_time:1029196ms step_avg:227.70ms step:4521/6710 train_time:1029435ms step_avg:227.70ms step:4522/6710 train_time:1029674ms step_avg:227.70ms step:4523/6710 train_time:1029911ms step_avg:227.71ms step:4524/6710 train_time:1030148ms step_avg:227.71ms step:4525/6710 train_time:1030385ms step_avg:227.71ms step:4526/6710 train_time:1030624ms step_avg:227.71ms step:4527/6710 train_time:1030861ms step_avg:227.71ms step:4528/6710 train_time:1031100ms step_avg:227.72ms step:4529/6710 train_time:1031339ms step_avg:227.72ms step:4530/6710 train_time:1031580ms step_avg:227.72ms step:4531/6710 train_time:1031816ms step_avg:227.72ms step:4532/6710 train_time:1032056ms step_avg:227.73ms step:4533/6710 train_time:1032297ms step_avg:227.73ms step:4534/6710 train_time:1032534ms step_avg:227.73ms step:4535/6710 train_time:1032772ms step_avg:227.73ms 
step:4536/6710 train_time:1033008ms step_avg:227.74ms step:4537/6710 train_time:1033247ms step_avg:227.74ms step:4538/6710 train_time:1033484ms step_avg:227.74ms step:4539/6710 train_time:1033724ms step_avg:227.74ms step:4540/6710 train_time:1033960ms step_avg:227.74ms step:4541/6710 train_time:1034202ms step_avg:227.75ms step:4542/6710 train_time:1034439ms step_avg:227.75ms step:4543/6710 train_time:1034677ms step_avg:227.75ms step:4544/6710 train_time:1034913ms step_avg:227.75ms step:4545/6710 train_time:1035152ms step_avg:227.76ms step:4546/6710 train_time:1035391ms step_avg:227.76ms step:4547/6710 train_time:1035628ms step_avg:227.76ms step:4548/6710 train_time:1035866ms step_avg:227.76ms step:4549/6710 train_time:1036102ms step_avg:227.76ms step:4550/6710 train_time:1036342ms step_avg:227.77ms step:4551/6710 train_time:1036578ms step_avg:227.77ms step:4552/6710 train_time:1036817ms step_avg:227.77ms step:4553/6710 train_time:1037055ms step_avg:227.77ms step:4554/6710 train_time:1037294ms step_avg:227.78ms step:4555/6710 train_time:1037531ms step_avg:227.78ms step:4556/6710 train_time:1037767ms step_avg:227.78ms step:4557/6710 train_time:1038004ms step_avg:227.78ms step:4558/6710 train_time:1038243ms step_avg:227.78ms step:4559/6710 train_time:1038480ms step_avg:227.79ms step:4560/6710 train_time:1038718ms step_avg:227.79ms step:4561/6710 train_time:1038955ms step_avg:227.79ms step:4562/6710 train_time:1039194ms step_avg:227.79ms step:4563/6710 train_time:1039434ms step_avg:227.80ms step:4564/6710 train_time:1039673ms step_avg:227.80ms step:4565/6710 train_time:1039912ms step_avg:227.80ms step:4566/6710 train_time:1040149ms step_avg:227.80ms step:4567/6710 train_time:1040387ms step_avg:227.81ms step:4568/6710 train_time:1040626ms step_avg:227.81ms step:4569/6710 train_time:1040862ms step_avg:227.81ms step:4570/6710 train_time:1041097ms step_avg:227.81ms step:4571/6710 train_time:1041338ms step_avg:227.81ms step:4572/6710 train_time:1041576ms step_avg:227.82ms 
step:4573/6710 train_time:1041814ms step_avg:227.82ms step:4574/6710 train_time:1042054ms step_avg:227.82ms step:4575/6710 train_time:1042295ms step_avg:227.82ms step:4576/6710 train_time:1042532ms step_avg:227.83ms step:4577/6710 train_time:1042770ms step_avg:227.83ms step:4578/6710 train_time:1043010ms step_avg:227.83ms step:4579/6710 train_time:1043247ms step_avg:227.83ms step:4580/6710 train_time:1043485ms step_avg:227.84ms step:4581/6710 train_time:1043728ms step_avg:227.84ms step:4582/6710 train_time:1043962ms step_avg:227.84ms step:4583/6710 train_time:1044198ms step_avg:227.84ms step:4584/6710 train_time:1044436ms step_avg:227.84ms step:4585/6710 train_time:1044676ms step_avg:227.85ms step:4586/6710 train_time:1044916ms step_avg:227.85ms step:4587/6710 train_time:1045150ms step_avg:227.85ms step:4588/6710 train_time:1045389ms step_avg:227.85ms step:4589/6710 train_time:1045626ms step_avg:227.85ms step:4590/6710 train_time:1045865ms step_avg:227.86ms step:4591/6710 train_time:1046104ms step_avg:227.86ms step:4592/6710 train_time:1046341ms step_avg:227.86ms step:4593/6710 train_time:1046580ms step_avg:227.86ms step:4594/6710 train_time:1046817ms step_avg:227.87ms step:4595/6710 train_time:1047053ms step_avg:227.87ms step:4596/6710 train_time:1047296ms step_avg:227.87ms step:4597/6710 train_time:1047538ms step_avg:227.87ms step:4598/6710 train_time:1047775ms step_avg:227.88ms step:4599/6710 train_time:1048014ms step_avg:227.88ms step:4600/6710 train_time:1048252ms step_avg:227.88ms step:4601/6710 train_time:1048490ms step_avg:227.88ms step:4602/6710 train_time:1048726ms step_avg:227.88ms step:4603/6710 train_time:1048965ms step_avg:227.89ms step:4604/6710 train_time:1049204ms step_avg:227.89ms step:4605/6710 train_time:1049443ms step_avg:227.89ms step:4606/6710 train_time:1049678ms step_avg:227.89ms step:4607/6710 train_time:1049915ms step_avg:227.90ms step:4608/6710 train_time:1050157ms step_avg:227.90ms step:4609/6710 train_time:1050395ms step_avg:227.90ms 
step:4610/6710 train_time:1050635ms step_avg:227.90ms step:4611/6710 train_time:1050873ms step_avg:227.91ms step:4612/6710 train_time:1051112ms step_avg:227.91ms step:4613/6710 train_time:1051351ms step_avg:227.91ms step:4614/6710 train_time:1051589ms step_avg:227.91ms step:4615/6710 train_time:1051828ms step_avg:227.91ms step:4616/6710 train_time:1052069ms step_avg:227.92ms step:4617/6710 train_time:1052307ms step_avg:227.92ms step:4618/6710 train_time:1052541ms step_avg:227.92ms step:4619/6710 train_time:1052778ms step_avg:227.92ms step:4620/6710 train_time:1053016ms step_avg:227.93ms step:4621/6710 train_time:1053255ms step_avg:227.93ms step:4622/6710 train_time:1053491ms step_avg:227.93ms step:4623/6710 train_time:1053731ms step_avg:227.93ms step:4624/6710 train_time:1053967ms step_avg:227.93ms step:4625/6710 train_time:1054206ms step_avg:227.94ms step:4625/6710 val_loss:3.038444 train_time:1054393ms step_avg:227.98ms Parameter containing: tensor([1.0000, 1.0000, 0.4064, 1.0000, 0.5213, 1.0000, 0.4348, 1.0000], device='cuda:0', requires_grad=True) 0 [7.551105976104736, 6.5511040687561035] 1 [0.5009860396385193, 6.132352352142334] 2 [0.6903342008590698, 4.012848854064941] 3 [0.6754482984542847, 3.3597638607025146] 4 [0.3852398693561554, 2.472730875015259] 5 [0.6489765048027039, 3.342377185821533] 6 [0.5184406638145447, 2.3497507572174072] 7 [0.7156690955162048, 5.202853202819824] 8 [0.47048014402389526, 0.732533872127533] 9 [0.49187737703323364, 1.89407217502594] 10 [0.6367177963256836, 2.5128047466278076] 11 [0.446974515914917, 2.6205763816833496] 12 [0.8931507468223572, 5.912843227386475] 13 [0.9919220805168152, 3.2409474849700928] 14 [0.946326494216919, 1.221722960472107] 15 [0.867372453212738, 0.16379082202911377] 0 [14.10338306427002, 24.52924919128418, 30.702672958374023] 1 [28.057146072387695, 26.216796875, 66.21002960205078] 2 [61.040611267089844, 21.04997444152832, 27.9575252532959] 3 [55.98112487792969, 27.39457130432129, 32.75975799560547] 4 
[33.39092254638672, 25.272262573242188, 27.81203842163086] 5 [42.457427978515625, 24.21088409423828, 35.87007141113281] 6 [39.76518249511719, 27.36322784423828, 27.006515502929688] 7 [51.00477600097656, 0.0, 39.778629302978516] 8 [35.617889404296875, 27.8446044921875, 41.8837776184082] 9 [50.11343765258789, 24.439546585083008, 34.1210823059082] 10 [66.64632415771484, 25.259645462036133, 33.465309143066406] 11 [53.64426803588867, 30.929168701171875, 19.974206924438477] 12 [76.63539123535156, 24.718324661254883, 21.275623321533203] 13 [99.99404907226562, 19.014101028442383, 25.319067001342773] 14 [109.44085693359375, 22.34588623046875, 34.44697570800781] 15 [112.13289642333984, 77.2568359375, 126.64970397949219] step:4626/6710 train_time:1054445ms step_avg:227.94ms step:4627/6710 train_time:1054679ms step_avg:227.94ms step:4628/6710 train_time:1054923ms step_avg:227.94ms step:4629/6710 train_time:1055157ms step_avg:227.94ms step:4630/6710 train_time:1055398ms step_avg:227.95ms step:4631/6710 train_time:1055634ms step_avg:227.95ms step:4632/6710 train_time:1055873ms step_avg:227.95ms step:4633/6710 train_time:1056110ms step_avg:227.95ms step:4634/6710 train_time:1056349ms step_avg:227.96ms step:4635/6710 train_time:1056586ms step_avg:227.96ms step:4636/6710 train_time:1056826ms step_avg:227.96ms step:4637/6710 train_time:1057063ms step_avg:227.96ms step:4638/6710 train_time:1057301ms step_avg:227.96ms step:4639/6710 train_time:1057541ms step_avg:227.97ms step:4640/6710 train_time:1057781ms step_avg:227.97ms step:4641/6710 train_time:1058021ms step_avg:227.97ms step:4642/6710 train_time:1058259ms step_avg:227.97ms step:4643/6710 train_time:1058496ms step_avg:227.98ms step:4644/6710 train_time:1058740ms step_avg:227.98ms step:4645/6710 train_time:1058979ms step_avg:227.98ms step:4646/6710 train_time:1059214ms step_avg:227.98ms step:4647/6710 train_time:1059450ms step_avg:227.99ms step:4648/6710 train_time:1059690ms step_avg:227.99ms step:4649/6710 train_time:1059931ms 
step_avg:227.99ms step:4650/6710 train_time:1060170ms step_avg:227.99ms step:4651/6710 train_time:1060407ms step_avg:228.00ms step:4652/6710 train_time:1060644ms step_avg:228.00ms step:4653/6710 train_time:1060882ms step_avg:228.00ms step:4654/6710 train_time:1061121ms step_avg:228.00ms step:4655/6710 train_time:1061359ms step_avg:228.00ms step:4656/6710 train_time:1061597ms step_avg:228.01ms step:4657/6710 train_time:1061836ms step_avg:228.01ms step:4658/6710 train_time:1062073ms step_avg:228.01ms step:4659/6710 train_time:1062313ms step_avg:228.01ms step:4660/6710 train_time:1062549ms step_avg:228.01ms step:4661/6710 train_time:1062785ms step_avg:228.02ms step:4662/6710 train_time:1063023ms step_avg:228.02ms step:4663/6710 train_time:1063263ms step_avg:228.02ms step:4664/6710 train_time:1063502ms step_avg:228.02ms step:4665/6710 train_time:1063741ms step_avg:228.03ms step:4666/6710 train_time:1063980ms step_avg:228.03ms step:4667/6710 train_time:1064218ms step_avg:228.03ms step:4668/6710 train_time:1064455ms step_avg:228.03ms step:4669/6710 train_time:1064693ms step_avg:228.03ms step:4670/6710 train_time:1064931ms step_avg:228.04ms step:4671/6710 train_time:1065169ms step_avg:228.04ms step:4672/6710 train_time:1065408ms step_avg:228.04ms step:4673/6710 train_time:1065644ms step_avg:228.04ms step:4674/6710 train_time:1065882ms step_avg:228.04ms step:4675/6710 train_time:1066121ms step_avg:228.05ms step:4676/6710 train_time:1066359ms step_avg:228.05ms step:4677/6710 train_time:1066597ms step_avg:228.05ms step:4678/6710 train_time:1066834ms step_avg:228.05ms step:4679/6710 train_time:1067074ms step_avg:228.06ms step:4680/6710 train_time:1067313ms step_avg:228.06ms step:4681/6710 train_time:1067554ms step_avg:228.06ms step:4682/6710 train_time:1067792ms step_avg:228.06ms step:4683/6710 train_time:1068033ms step_avg:228.07ms step:4684/6710 train_time:1068270ms step_avg:228.07ms step:4685/6710 train_time:1068508ms step_avg:228.07ms step:4686/6710 train_time:1068746ms 
step_avg:228.07ms step:4687/6710 train_time:1068985ms step_avg:228.07ms step:4688/6710 train_time:1069225ms step_avg:228.08ms step:4689/6710 train_time:1069464ms step_avg:228.08ms step:4690/6710 train_time:1069702ms step_avg:228.08ms step:4691/6710 train_time:1069940ms step_avg:228.08ms step:4692/6710 train_time:1070178ms step_avg:228.09ms step:4693/6710 train_time:1070417ms step_avg:228.09ms step:4694/6710 train_time:1070657ms step_avg:228.09ms step:4695/6710 train_time:1070895ms step_avg:228.09ms step:4696/6710 train_time:1071133ms step_avg:228.09ms step:4697/6710 train_time:1071370ms step_avg:228.10ms step:4698/6710 train_time:1071606ms step_avg:228.10ms step:4699/6710 train_time:1071845ms step_avg:228.10ms step:4700/6710 train_time:1072083ms step_avg:228.10ms step:4701/6710 train_time:1072321ms step_avg:228.10ms step:4702/6710 train_time:1072561ms step_avg:228.11ms step:4703/6710 train_time:1072796ms step_avg:228.11ms step:4704/6710 train_time:1073035ms step_avg:228.11ms step:4705/6710 train_time:1073271ms step_avg:228.11ms step:4706/6710 train_time:1073510ms step_avg:228.12ms step:4707/6710 train_time:1073751ms step_avg:228.12ms step:4708/6710 train_time:1073988ms step_avg:228.12ms step:4709/6710 train_time:1074225ms step_avg:228.12ms step:4710/6710 train_time:1074467ms step_avg:228.12ms step:4711/6710 train_time:1074704ms step_avg:228.13ms step:4712/6710 train_time:1074941ms step_avg:228.13ms step:4713/6710 train_time:1075179ms step_avg:228.13ms step:4714/6710 train_time:1075417ms step_avg:228.13ms step:4715/6710 train_time:1075656ms step_avg:228.13ms step:4716/6710 train_time:1075894ms step_avg:228.14ms step:4717/6710 train_time:1076133ms step_avg:228.14ms step:4718/6710 train_time:1076372ms step_avg:228.14ms step:4719/6710 train_time:1076610ms step_avg:228.14ms step:4720/6710 train_time:1076846ms step_avg:228.15ms step:4721/6710 train_time:1077082ms step_avg:228.15ms step:4722/6710 train_time:1077320ms step_avg:228.15ms step:4723/6710 train_time:1077559ms 
step_avg:228.15ms step:4724/6710 train_time:1077796ms step_avg:228.15ms step:4725/6710 train_time:1078037ms step_avg:228.16ms step:4726/6710 train_time:1078278ms step_avg:228.16ms step:4727/6710 train_time:1078515ms step_avg:228.16ms step:4728/6710 train_time:1078751ms step_avg:228.16ms step:4729/6710 train_time:1078988ms step_avg:228.16ms step:4730/6710 train_time:1079225ms step_avg:228.17ms step:4731/6710 train_time:1079464ms step_avg:228.17ms step:4732/6710 train_time:1079701ms step_avg:228.17ms step:4733/6710 train_time:1079940ms step_avg:228.17ms step:4734/6710 train_time:1080176ms step_avg:228.17ms step:4735/6710 train_time:1080413ms step_avg:228.18ms step:4736/6710 train_time:1080649ms step_avg:228.18ms step:4737/6710 train_time:1080885ms step_avg:228.18ms step:4738/6710 train_time:1081125ms step_avg:228.18ms step:4739/6710 train_time:1081366ms step_avg:228.18ms step:4740/6710 train_time:1081606ms step_avg:228.19ms step:4741/6710 train_time:1081844ms step_avg:228.19ms step:4742/6710 train_time:1082085ms step_avg:228.19ms step:4743/6710 train_time:1082323ms step_avg:228.19ms step:4744/6710 train_time:1082560ms step_avg:228.20ms step:4745/6710 train_time:1082797ms step_avg:228.20ms step:4746/6710 train_time:1083034ms step_avg:228.20ms step:4747/6710 train_time:1083274ms step_avg:228.20ms step:4748/6710 train_time:1083514ms step_avg:228.20ms step:4749/6710 train_time:1083751ms step_avg:228.21ms step:4750/6710 train_time:1083987ms step_avg:228.21ms step:4750/6710 val_loss:3.029505 train_time:1084173ms step_avg:228.25ms Parameter containing: tensor([1.0000, 1.0000, 0.4097, 1.0000, 0.5127, 1.0000, 0.4260, 1.0000], device='cuda:0', requires_grad=True) 0 [7.510849952697754, 6.510848045349121] 1 [0.49861282110214233, 6.070657730102539] 2 [0.6766057014465332, 3.901515483856201] 3 [0.6780496835708618, 3.2807912826538086] 4 [0.3879418969154358, 2.4233763217926025] 5 [0.6496724486351013, 3.2804319858551025] 6 [0.5154710412025452, 2.285400629043579] 7 [0.7128025889396667, 
5.117234230041504] 8 [0.47661492228507996, 0.6702328324317932] 9 [0.491907000541687, 1.8234449625015259] 10 [0.635995090007782, 2.4457552433013916] 11 [0.4519791007041931, 2.5498383045196533] 12 [0.8848716616630554, 5.820878982543945] 13 [0.9857457876205444, 3.1806092262268066] 14 [0.9429733753204346, 1.1592366695404053] 15 [0.8701980113983154, 0.0899469405412674] 0 [14.024210929870605, 24.154834747314453, 30.475296020507812] 1 [27.644250869750977, 25.584585189819336, 64.88185119628906] 2 [58.62731170654297, 20.692378997802734, 27.543338775634766] 3 [54.391517639160156, 26.82432746887207, 32.20224380493164] 4 [32.79872512817383, 24.75229835510254, 27.914888381958008] 5 [41.92262268066406, 23.89447021484375, 35.209716796875] 6 [38.97556686401367, 26.96858024597168, 26.600542068481445] 7 [49.89175796508789, 0.0, 38.626956939697266] 8 [35.1575927734375, 27.323781967163086, 41.095001220703125] 9 [48.98686218261719, 23.965133666992188, 33.68289566040039] 10 [65.08655548095703, 24.81426429748535, 32.86759948730469] 11 [53.004032135009766, 30.334396362304688, 19.967090606689453] 12 [74.961181640625, 24.505569458007812, 21.113298416137695] 13 [97.58367156982422, 18.347139358520508, 24.953187942504883] 14 [106.54208374023438, 21.403549194335938, 33.94085693359375] 15 [109.5255355834961, 75.02759552001953, 123.1218490600586] step:4751/6710 train_time:1084374ms step_avg:228.24ms step:4752/6710 train_time:1084607ms step_avg:228.24ms step:4753/6710 train_time:1084841ms step_avg:228.24ms step:4754/6710 train_time:1085077ms step_avg:228.24ms step:4755/6710 train_time:1085320ms step_avg:228.25ms step:4756/6710 train_time:1085560ms step_avg:228.25ms step:4757/6710 train_time:1085796ms step_avg:228.25ms step:4758/6710 train_time:1086034ms step_avg:228.25ms step:4759/6710 train_time:1086273ms step_avg:228.26ms step:4760/6710 train_time:1086512ms step_avg:228.26ms step:4761/6710 train_time:1086749ms step_avg:228.26ms step:4762/6710 train_time:1086984ms step_avg:228.26ms step:4763/6710 
train_time:1087223ms step_avg:228.26ms step:4764/6710 train_time:1087464ms step_avg:228.27ms step:4765/6710 train_time:1087702ms step_avg:228.27ms step:4766/6710 train_time:1087941ms step_avg:228.27ms step:4767/6710 train_time:1088179ms step_avg:228.27ms step:4768/6710 train_time:1088415ms step_avg:228.27ms step:4769/6710 train_time:1088653ms step_avg:228.28ms step:4770/6710 train_time:1088890ms step_avg:228.28ms step:4771/6710 train_time:1089128ms step_avg:228.28ms step:4772/6710 train_time:1089366ms step_avg:228.28ms step:4773/6710 train_time:1089605ms step_avg:228.29ms step:4774/6710 train_time:1089842ms step_avg:228.29ms step:4775/6710 train_time:1090079ms step_avg:228.29ms step:4776/6710 train_time:1090315ms step_avg:228.29ms step:4777/6710 train_time:1090553ms step_avg:228.29ms step:4778/6710 train_time:1090790ms step_avg:228.29ms step:4779/6710 train_time:1091028ms step_avg:228.30ms step:4780/6710 train_time:1091265ms step_avg:228.30ms step:4781/6710 train_time:1091504ms step_avg:228.30ms step:4782/6710 train_time:1091742ms step_avg:228.30ms step:4783/6710 train_time:1091980ms step_avg:228.30ms step:4784/6710 train_time:1092219ms step_avg:228.31ms step:4785/6710 train_time:1092457ms step_avg:228.31ms step:4786/6710 train_time:1092696ms step_avg:228.31ms step:4787/6710 train_time:1092933ms step_avg:228.31ms step:4788/6710 train_time:1093174ms step_avg:228.32ms step:4789/6710 train_time:1093418ms step_avg:228.32ms step:4790/6710 train_time:1093654ms step_avg:228.32ms step:4791/6710 train_time:1093895ms step_avg:228.32ms step:4792/6710 train_time:1094133ms step_avg:228.32ms step:4793/6710 train_time:1094373ms step_avg:228.33ms step:4794/6710 train_time:1094610ms step_avg:228.33ms step:4795/6710 train_time:1094849ms step_avg:228.33ms step:4796/6710 train_time:1095087ms step_avg:228.33ms step:4797/6710 train_time:1095326ms step_avg:228.34ms step:4798/6710 train_time:1095566ms step_avg:228.34ms step:4799/6710 train_time:1095802ms step_avg:228.34ms step:4800/6710 
train_time:1096039ms step_avg:228.34ms step:4801/6710 train_time:1096279ms step_avg:228.34ms step:4802/6710 train_time:1096517ms step_avg:228.35ms step:4803/6710 train_time:1096755ms step_avg:228.35ms step:4804/6710 train_time:1096993ms step_avg:228.35ms step:4805/6710 train_time:1097233ms step_avg:228.35ms step:4806/6710 train_time:1097471ms step_avg:228.35ms step:4807/6710 train_time:1097712ms step_avg:228.36ms step:4808/6710 train_time:1097950ms step_avg:228.36ms step:4809/6710 train_time:1098188ms step_avg:228.36ms step:4810/6710 train_time:1098426ms step_avg:228.36ms step:4811/6710 train_time:1098663ms step_avg:228.36ms step:4812/6710 train_time:1098901ms step_avg:228.37ms step:4813/6710 train_time:1099139ms step_avg:228.37ms step:4814/6710 train_time:1099377ms step_avg:228.37ms step:4815/6710 train_time:1099616ms step_avg:228.37ms step:4816/6710 train_time:1099852ms step_avg:228.37ms step:4817/6710 train_time:1100094ms step_avg:228.38ms step:4818/6710 train_time:1100332ms step_avg:228.38ms step:4819/6710 train_time:1100569ms step_avg:228.38ms step:4820/6710 train_time:1100807ms step_avg:228.38ms step:4821/6710 train_time:1101046ms step_avg:228.39ms step:4822/6710 train_time:1101287ms step_avg:228.39ms step:4823/6710 train_time:1101525ms step_avg:228.39ms step:4824/6710 train_time:1101764ms step_avg:228.39ms step:4825/6710 train_time:1102002ms step_avg:228.39ms step:4826/6710 train_time:1102240ms step_avg:228.40ms step:4827/6710 train_time:1102478ms step_avg:228.40ms step:4828/6710 train_time:1102714ms step_avg:228.40ms step:4829/6710 train_time:1102951ms step_avg:228.40ms step:4830/6710 train_time:1103191ms step_avg:228.40ms step:4831/6710 train_time:1103426ms step_avg:228.41ms step:4832/6710 train_time:1103664ms step_avg:228.41ms step:4833/6710 train_time:1103901ms step_avg:228.41ms step:4834/6710 train_time:1104139ms step_avg:228.41ms step:4835/6710 train_time:1104375ms step_avg:228.41ms step:4836/6710 train_time:1104616ms step_avg:228.42ms step:4837/6710 
train_time:1104854ms step_avg:228.42ms step:4838/6710 train_time:1105092ms step_avg:228.42ms step:4839/6710 train_time:1105330ms step_avg:228.42ms step:4840/6710 train_time:1105569ms step_avg:228.42ms step:4841/6710 train_time:1105809ms step_avg:228.43ms step:4842/6710 train_time:1106047ms step_avg:228.43ms step:4843/6710 train_time:1106284ms step_avg:228.43ms step:4844/6710 train_time:1106521ms step_avg:228.43ms step:4845/6710 train_time:1106757ms step_avg:228.43ms step:4846/6710 train_time:1106995ms step_avg:228.43ms step:4847/6710 train_time:1107234ms step_avg:228.44ms step:4848/6710 train_time:1107473ms step_avg:228.44ms step:4849/6710 train_time:1107713ms step_avg:228.44ms step:4850/6710 train_time:1107950ms step_avg:228.44ms step:4851/6710 train_time:1108189ms step_avg:228.45ms step:4852/6710 train_time:1108427ms step_avg:228.45ms step:4853/6710 train_time:1108667ms step_avg:228.45ms step:4854/6710 train_time:1108905ms step_avg:228.45ms step:4855/6710 train_time:1109144ms step_avg:228.45ms step:4856/6710 train_time:1109382ms step_avg:228.46ms step:4857/6710 train_time:1109619ms step_avg:228.46ms step:4858/6710 train_time:1109855ms step_avg:228.46ms step:4859/6710 train_time:1110093ms step_avg:228.46ms step:4860/6710 train_time:1110335ms step_avg:228.46ms step:4861/6710 train_time:1110573ms step_avg:228.47ms step:4862/6710 train_time:1110811ms step_avg:228.47ms step:4863/6710 train_time:1111049ms step_avg:228.47ms step:4864/6710 train_time:1111287ms step_avg:228.47ms step:4865/6710 train_time:1111523ms step_avg:228.47ms step:4866/6710 train_time:1111760ms step_avg:228.48ms step:4867/6710 train_time:1112000ms step_avg:228.48ms step:4868/6710 train_time:1112236ms step_avg:228.48ms step:4869/6710 train_time:1112472ms step_avg:228.48ms step:4870/6710 train_time:1112710ms step_avg:228.48ms step:4871/6710 train_time:1112949ms step_avg:228.48ms step:4872/6710 train_time:1113188ms step_avg:228.49ms step:4873/6710 train_time:1113428ms step_avg:228.49ms step:4874/6710 
train_time:1113667ms step_avg:228.49ms step:4875/6710 train_time:1113904ms step_avg:228.49ms step:4875/6710 val_loss:3.021799 train_time:1114091ms step_avg:228.53ms Parameter containing: tensor([1.0000, 1.0000, 0.4111, 1.0000, 0.5077, 1.0000, 0.4111, 1.0000], device='cuda:0', requires_grad=True) 0 [7.464210033416748, 6.464208126068115] 1 [0.49236711859703064, 5.986398696899414] 2 [0.6662137508392334, 3.7942192554473877] 3 [0.6806812882423401, 3.2047622203826904] 4 [0.3887662887573242, 2.359968423843384] 5 [0.6396349668502808, 3.1791062355041504] 6 [0.5167333483695984, 2.1903820037841797] 7 [0.709382951259613, 5.018332481384277] 8 [0.47905299067497253, 0.5761205554008484] 9 [0.49456509947776794, 1.7439780235290527] 10 [0.633223831653595, 2.3669090270996094] 11 [0.4543646574020386, 2.4745826721191406] 12 [0.8837102055549622, 5.731138706207275] 13 [0.9813041090965271, 3.129397392272949] 14 [0.9427030086517334, 1.1137244701385498] 15 [0.8739708662033081, 0.03603116422891617] 0 [13.930967330932617, 23.91343879699707, 29.562057495117188] 1 [26.82398796081543, 25.161949157714844, 63.44724655151367] 2 [56.370765686035156, 20.090490341186523, 26.801210403442383] 3 [52.7080192565918, 26.15617561340332, 31.481807708740234] 4 [31.95477294921875, 24.20561981201172, 27.534236907958984] 5 [40.41724395751953, 23.252300262451172, 34.783851623535156] 6 [38.03203582763672, 26.453487396240234, 26.29572296142578] 7 [48.616397857666016, 0.0, 37.55921173095703] 8 [34.376365661621094, 26.72776222229004, 40.17698669433594] 9 [47.72389221191406, 23.423656463623047, 32.81721878051758] 10 [62.9815559387207, 24.313278198242188, 32.05527877807617] 11 [51.66033935546875, 29.860990524291992, 19.681533813476562] 12 [73.2469482421875, 24.26864242553711, 20.778764724731445] 13 [95.21620178222656, 17.79262351989746, 24.31167984008789] 14 [103.95062255859375, 21.04802703857422, 33.04533767700195] 15 [107.38346862792969, 73.56344604492188, 120.12061309814453] step:4876/6710 train_time:1114142ms 
step_avg:228.50ms step:4877/6710 train_time:1114379ms step_avg:228.50ms step:4878/6710 train_time:1114624ms step_avg:228.50ms step:4879/6710 train_time:1114857ms step_avg:228.50ms step:4880/6710 train_time:1115097ms step_avg:228.50ms step:4881/6710 train_time:1115334ms step_avg:228.51ms step:4882/6710 train_time:1115575ms step_avg:228.51ms step:4883/6710 train_time:1115813ms step_avg:228.51ms step:4884/6710 train_time:1116051ms step_avg:228.51ms step:4885/6710 train_time:1116291ms step_avg:228.51ms step:4886/6710 train_time:1116529ms step_avg:228.52ms step:4887/6710 train_time:1116769ms step_avg:228.52ms step:4888/6710 train_time:1117008ms step_avg:228.52ms step:4889/6710 train_time:1117243ms step_avg:228.52ms step:4890/6710 train_time:1117479ms step_avg:228.52ms step:4891/6710 train_time:1117718ms step_avg:228.53ms step:4892/6710 train_time:1117957ms step_avg:228.53ms step:4893/6710 train_time:1118194ms step_avg:228.53ms step:4894/6710 train_time:1118432ms step_avg:228.53ms step:4895/6710 train_time:1118669ms step_avg:228.53ms step:4896/6710 train_time:1118908ms step_avg:228.54ms step:4897/6710 train_time:1119144ms step_avg:228.54ms step:4898/6710 train_time:1119385ms step_avg:228.54ms step:4899/6710 train_time:1119621ms step_avg:228.54ms step:4900/6710 train_time:1119861ms step_avg:228.54ms step:4901/6710 train_time:1120102ms step_avg:228.55ms step:4902/6710 train_time:1120339ms step_avg:228.55ms step:4903/6710 train_time:1120576ms step_avg:228.55ms step:4904/6710 train_time:1120815ms step_avg:228.55ms step:4905/6710 train_time:1121054ms step_avg:228.55ms step:4906/6710 train_time:1121294ms step_avg:228.56ms step:4907/6710 train_time:1121532ms step_avg:228.56ms step:4908/6710 train_time:1121770ms step_avg:228.56ms step:4909/6710 train_time:1122006ms step_avg:228.56ms step:4910/6710 train_time:1122244ms step_avg:228.56ms step:4911/6710 train_time:1122482ms step_avg:228.56ms step:4912/6710 train_time:1122720ms step_avg:228.57ms step:4913/6710 train_time:1122957ms 
step_avg:228.57ms step:4914/6710 train_time:1123196ms step_avg:228.57ms step:4915/6710 train_time:1123433ms step_avg:228.57ms step:4916/6710 train_time:1123671ms step_avg:228.57ms step:4917/6710 train_time:1123909ms step_avg:228.58ms step:4918/6710 train_time:1124145ms step_avg:228.58ms step:4919/6710 train_time:1124387ms step_avg:228.58ms step:4920/6710 train_time:1124623ms step_avg:228.58ms step:4921/6710 train_time:1124860ms step_avg:228.58ms step:4922/6710 train_time:1125095ms step_avg:228.58ms step:4923/6710 train_time:1125333ms step_avg:228.59ms step:4924/6710 train_time:1125571ms step_avg:228.59ms step:4925/6710 train_time:1125810ms step_avg:228.59ms step:4926/6710 train_time:1126046ms step_avg:228.59ms step:4927/6710 train_time:1126284ms step_avg:228.59ms step:4928/6710 train_time:1126522ms step_avg:228.60ms step:4929/6710 train_time:1126759ms step_avg:228.60ms step:4930/6710 train_time:1126996ms step_avg:228.60ms step:4931/6710 train_time:1127233ms step_avg:228.60ms step:4932/6710 train_time:1127471ms step_avg:228.60ms step:4933/6710 train_time:1127712ms step_avg:228.61ms step:4934/6710 train_time:1127952ms step_avg:228.61ms step:4935/6710 train_time:1128188ms step_avg:228.61ms step:4936/6710 train_time:1128429ms step_avg:228.61ms step:4937/6710 train_time:1128668ms step_avg:228.61ms step:4938/6710 train_time:1128905ms step_avg:228.62ms step:4939/6710 train_time:1129145ms step_avg:228.62ms step:4940/6710 train_time:1129384ms step_avg:228.62ms step:4941/6710 train_time:1129621ms step_avg:228.62ms step:4942/6710 train_time:1129858ms step_avg:228.62ms step:4943/6710 train_time:1130095ms step_avg:228.63ms step:4944/6710 train_time:1130334ms step_avg:228.63ms step:4945/6710 train_time:1130576ms step_avg:228.63ms step:4946/6710 train_time:1130814ms step_avg:228.63ms step:4947/6710 train_time:1131050ms step_avg:228.63ms step:4948/6710 train_time:1131288ms step_avg:228.64ms step:4949/6710 train_time:1131526ms step_avg:228.64ms step:4950/6710 train_time:1131764ms 
step_avg:228.64ms step:4951/6710 train_time:1132000ms step_avg:228.64ms step:4952/6710 train_time:1132239ms step_avg:228.64ms step:4953/6710 train_time:1132477ms step_avg:228.64ms step:4954/6710 train_time:1132713ms step_avg:228.65ms step:4955/6710 train_time:1132955ms step_avg:228.65ms step:4956/6710 train_time:1133194ms step_avg:228.65ms step:4957/6710 train_time:1133431ms step_avg:228.65ms step:4958/6710 train_time:1133669ms step_avg:228.65ms step:4959/6710 train_time:1133909ms step_avg:228.66ms step:4960/6710 train_time:1134145ms step_avg:228.66ms step:4961/6710 train_time:1134381ms step_avg:228.66ms step:4962/6710 train_time:1134619ms step_avg:228.66ms step:4963/6710 train_time:1134856ms step_avg:228.66ms step:4964/6710 train_time:1135097ms step_avg:228.67ms step:4965/6710 train_time:1135336ms step_avg:228.67ms step:4966/6710 train_time:1135578ms step_avg:228.67ms step:4967/6710 train_time:1135816ms step_avg:228.67ms step:4968/6710 train_time:1136058ms step_avg:228.68ms step:4969/6710 train_time:1136297ms step_avg:228.68ms step:4970/6710 train_time:1136533ms step_avg:228.68ms step:4971/6710 train_time:1136772ms step_avg:228.68ms step:4972/6710 train_time:1137009ms step_avg:228.68ms step:4973/6710 train_time:1137251ms step_avg:228.69ms step:4974/6710 train_time:1137490ms step_avg:228.69ms step:4975/6710 train_time:1137727ms step_avg:228.69ms step:4976/6710 train_time:1137964ms step_avg:228.69ms step:4977/6710 train_time:1138203ms step_avg:228.69ms step:4978/6710 train_time:1138443ms step_avg:228.69ms step:4979/6710 train_time:1138682ms step_avg:228.70ms step:4980/6710 train_time:1138920ms step_avg:228.70ms step:4981/6710 train_time:1139161ms step_avg:228.70ms step:4982/6710 train_time:1139400ms step_avg:228.70ms step:4983/6710 train_time:1139637ms step_avg:228.70ms step:4984/6710 train_time:1139874ms step_avg:228.71ms step:4985/6710 train_time:1140113ms step_avg:228.71ms step:4986/6710 train_time:1140352ms step_avg:228.71ms step:4987/6710 train_time:1140590ms 
step_avg:228.71ms step:4988/6710 train_time:1140829ms step_avg:228.71ms step:4989/6710 train_time:1141069ms step_avg:228.72ms step:4990/6710 train_time:1141307ms step_avg:228.72ms step:4991/6710 train_time:1141542ms step_avg:228.72ms step:4992/6710 train_time:1141781ms step_avg:228.72ms step:4993/6710 train_time:1142019ms step_avg:228.72ms step:4994/6710 train_time:1142259ms step_avg:228.73ms step:4995/6710 train_time:1142495ms step_avg:228.73ms step:4996/6710 train_time:1142737ms step_avg:228.73ms step:4997/6710 train_time:1142975ms step_avg:228.73ms step:4998/6710 train_time:1143213ms step_avg:228.73ms step:4999/6710 train_time:1143453ms step_avg:228.74ms step:5000/6710 train_time:1143691ms step_avg:228.74ms step:5000/6710 val_loss:3.012474 train_time:1143882ms step_avg:228.78ms Parameter containing: tensor([1.0000, 1.0000, 0.4076, 1.0000, 0.5029, 1.0000, 0.4080, 1.0000], device='cuda:0', requires_grad=True) 0 [7.410426139831543, 6.41042423248291] 1 [0.49320563673973083, 5.901867389678955] 2 [0.6606616973876953, 3.6787843704223633] 3 [0.6816691160202026, 3.1140389442443848] 4 [0.39217889308929443, 2.2926928997039795] 5 [0.6350106596946716, 3.080094575881958] 6 [0.509268581867218, 2.101241111755371] 7 [0.7006411552429199, 4.93300724029541] 8 [0.475391685962677, 0.5146291851997375] 9 [0.49000319838523865, 1.684253215789795] 10 [0.62978196144104, 2.292253255844116] 11 [0.4523492157459259, 2.400905132293701] 12 [0.8775443434715271, 5.653470039367676] 13 [0.9709017276763916, 3.074302911758423] 14 [0.939986526966095, 1.0577778816223145] 15 [0.8781464099884033, -0.018865443766117096] 0 [13.823981285095215, 23.212736129760742, 29.35694122314453] 1 [26.44449806213379, 24.64200782775879, 63.079463958740234] 2 [55.30887985229492, 19.621742248535156, 26.3061466217041] 3 [51.66219711303711, 25.44293212890625, 31.083328247070312] 4 [31.57318115234375, 23.763017654418945, 27.137758255004883] 5 [39.4768180847168, 22.775537490844727, 33.82893753051758] 6 [36.54262924194336, 
25.898229598999023, 25.873884201049805] 7 [46.617767333984375, 0.0, 36.94286346435547] 8 [33.0532341003418, 26.128875732421875, 39.2940559387207] 9 [45.76978302001953, 22.944473266601562, 32.27339553833008] 10 [60.668663024902344, 23.930936813354492, 31.455793380737305] 11 [49.89700698852539, 29.20606803894043, 19.376361846923828] 12 [70.75929260253906, 23.82752227783203, 20.360307693481445] 13 [91.42081451416016, 17.346477508544922, 23.577289581298828] 14 [99.69601440429688, 20.308454513549805, 32.195350646972656] 15 [103.69021606445312, 71.26903533935547, 116.67001342773438] step:5001/6710 train_time:1143933ms step_avg:228.74ms step:5002/6710 train_time:1144170ms step_avg:228.74ms step:5003/6710 train_time:1144414ms step_avg:228.75ms step:5004/6710 train_time:1144651ms step_avg:228.75ms step:5005/6710 train_time:1144889ms step_avg:228.75ms step:5006/6710 train_time:1145126ms step_avg:228.75ms step:5007/6710 train_time:1145368ms step_avg:228.75ms step:5008/6710 train_time:1145606ms step_avg:228.76ms step:5009/6710 train_time:1145844ms step_avg:228.76ms step:5010/6710 train_time:1146081ms step_avg:228.76ms step:5011/6710 train_time:1146319ms step_avg:228.76ms step:5012/6710 train_time:1146556ms step_avg:228.76ms step:5013/6710 train_time:1146795ms step_avg:228.76ms step:5014/6710 train_time:1147032ms step_avg:228.77ms step:5015/6710 train_time:1147272ms step_avg:228.77ms step:5016/6710 train_time:1147511ms step_avg:228.77ms step:5017/6710 train_time:1147751ms step_avg:228.77ms step:5018/6710 train_time:1147988ms step_avg:228.77ms step:5019/6710 train_time:1148227ms step_avg:228.78ms step:5020/6710 train_time:1148466ms step_avg:228.78ms step:5021/6710 train_time:1148705ms step_avg:228.78ms step:5022/6710 train_time:1148943ms step_avg:228.78ms step:5023/6710 train_time:1149182ms step_avg:228.78ms step:5024/6710 train_time:1149421ms step_avg:228.79ms step:5025/6710 train_time:1149659ms step_avg:228.79ms step:5026/6710 train_time:1149898ms step_avg:228.79ms 
step:5027/6710 train_time:1150135ms step_avg:228.79ms step:5028/6710 train_time:1150371ms step_avg:228.79ms step:5029/6710 train_time:1150611ms step_avg:228.80ms step:5030/6710 train_time:1150849ms step_avg:228.80ms step:5031/6710 train_time:1151089ms step_avg:228.80ms step:5032/6710 train_time:1151326ms step_avg:228.80ms step:5033/6710 train_time:1151565ms step_avg:228.80ms step:5034/6710 train_time:1151802ms step_avg:228.80ms step:5035/6710 train_time:1152041ms step_avg:228.81ms step:5036/6710 train_time:1152282ms step_avg:228.81ms step:5037/6710 train_time:1152524ms step_avg:228.81ms step:5038/6710 train_time:1152762ms step_avg:228.81ms step:5039/6710 train_time:1153001ms step_avg:228.82ms step:5040/6710 train_time:1153244ms step_avg:228.82ms step:5041/6710 train_time:1153483ms step_avg:228.82ms step:5042/6710 train_time:1153720ms step_avg:228.82ms step:5043/6710 train_time:1153957ms step_avg:228.82ms step:5044/6710 train_time:1154195ms step_avg:228.83ms step:5045/6710 train_time:1154435ms step_avg:228.83ms step:5046/6710 train_time:1154673ms step_avg:228.83ms step:5047/6710 train_time:1154915ms step_avg:228.83ms step:5048/6710 train_time:1155152ms step_avg:228.83ms step:5049/6710 train_time:1155390ms step_avg:228.84ms step:5050/6710 train_time:1155627ms step_avg:228.84ms step:5051/6710 train_time:1155865ms step_avg:228.84ms step:5052/6710 train_time:1156102ms step_avg:228.84ms step:5053/6710 train_time:1156340ms step_avg:228.84ms step:5054/6710 train_time:1156578ms step_avg:228.84ms step:5055/6710 train_time:1156819ms step_avg:228.85ms step:5056/6710 train_time:1157054ms step_avg:228.85ms step:5057/6710 train_time:1157291ms step_avg:228.85ms step:5058/6710 train_time:1157530ms step_avg:228.85ms step:5059/6710 train_time:1157769ms step_avg:228.85ms step:5060/6710 train_time:1158008ms step_avg:228.86ms step:5061/6710 train_time:1158248ms step_avg:228.86ms step:5062/6710 train_time:1158487ms step_avg:228.86ms step:5063/6710 train_time:1158724ms step_avg:228.86ms 
step:5064/6710 train_time:1158963ms step_avg:228.86ms step:5065/6710 train_time:1159202ms step_avg:228.87ms step:5066/6710 train_time:1159440ms step_avg:228.87ms step:5067/6710 train_time:1159678ms step_avg:228.87ms step:5068/6710 train_time:1159915ms step_avg:228.87ms step:5069/6710 train_time:1160153ms step_avg:228.87ms step:5070/6710 train_time:1160391ms step_avg:228.87ms step:5071/6710 train_time:1160630ms step_avg:228.88ms step:5072/6710 train_time:1160867ms step_avg:228.88ms step:5073/6710 train_time:1161105ms step_avg:228.88ms step:5074/6710 train_time:1161345ms step_avg:228.88ms step:5075/6710 train_time:1161582ms step_avg:228.88ms step:5076/6710 train_time:1161820ms step_avg:228.88ms step:5077/6710 train_time:1162058ms step_avg:228.89ms step:5078/6710 train_time:1162300ms step_avg:228.89ms step:5079/6710 train_time:1162542ms step_avg:228.89ms step:5080/6710 train_time:1162784ms step_avg:228.89ms step:5081/6710 train_time:1163021ms step_avg:228.90ms step:5082/6710 train_time:1163257ms step_avg:228.90ms step:5083/6710 train_time:1163496ms step_avg:228.90ms step:5084/6710 train_time:1163734ms step_avg:228.90ms step:5085/6710 train_time:1163975ms step_avg:228.90ms step:5086/6710 train_time:1164216ms step_avg:228.91ms step:5087/6710 train_time:1164452ms step_avg:228.91ms step:5088/6710 train_time:1164694ms step_avg:228.91ms step:5089/6710 train_time:1164931ms step_avg:228.91ms step:5090/6710 train_time:1165168ms step_avg:228.91ms step:5091/6710 train_time:1165406ms step_avg:228.91ms step:5092/6710 train_time:1165647ms step_avg:228.92ms step:5093/6710 train_time:1165887ms step_avg:228.92ms step:5094/6710 train_time:1166129ms step_avg:228.92ms step:5095/6710 train_time:1166367ms step_avg:228.92ms step:5096/6710 train_time:1166608ms step_avg:228.93ms step:5097/6710 train_time:1166845ms step_avg:228.93ms step:5098/6710 train_time:1167085ms step_avg:228.93ms step:5099/6710 train_time:1167325ms step_avg:228.93ms step:5100/6710 train_time:1167564ms step_avg:228.93ms 
step:5101/6710 train_time:1167807ms step_avg:228.94ms step:5102/6710 train_time:1168046ms step_avg:228.94ms step:5103/6710 train_time:1168285ms step_avg:228.94ms step:5104/6710 train_time:1168522ms step_avg:228.94ms step:5105/6710 train_time:1168763ms step_avg:228.94ms step:5106/6710 train_time:1169003ms step_avg:228.95ms step:5107/6710 train_time:1169240ms step_avg:228.95ms step:5108/6710 train_time:1169477ms step_avg:228.95ms step:5109/6710 train_time:1169716ms step_avg:228.95ms step:5110/6710 train_time:1169954ms step_avg:228.95ms step:5111/6710 train_time:1170191ms step_avg:228.96ms step:5112/6710 train_time:1170429ms step_avg:228.96ms step:5113/6710 train_time:1170668ms step_avg:228.96ms step:5114/6710 train_time:1170907ms step_avg:228.96ms step:5115/6710 train_time:1171146ms step_avg:228.96ms step:5116/6710 train_time:1171387ms step_avg:228.97ms step:5117/6710 train_time:1171626ms step_avg:228.97ms step:5118/6710 train_time:1171863ms step_avg:228.97ms step:5119/6710 train_time:1172101ms step_avg:228.97ms step:5120/6710 train_time:1172341ms step_avg:228.97ms step:5121/6710 train_time:1172582ms step_avg:228.98ms step:5122/6710 train_time:1172820ms step_avg:228.98ms step:5123/6710 train_time:1173056ms step_avg:228.98ms step:5124/6710 train_time:1173297ms step_avg:228.98ms step:5125/6710 train_time:1173535ms step_avg:228.98ms step:5125/6710 val_loss:3.004288 train_time:1173725ms step_avg:229.02ms Parameter containing: tensor([1.0000, 1.0000, 0.4073, 1.0000, 0.5060, 1.0000, 0.4063, 1.0000], device='cuda:0', requires_grad=True) 0 [7.352531909942627, 6.352530002593994] 1 [0.48888668417930603, 5.806914806365967] 2 [0.6511568427085876, 3.5572807788848877] 3 [0.6805934309959412, 3.0143325328826904] 4 [0.39397919178009033, 2.2231998443603516] 5 [0.6230712532997131, 2.9860832691192627] 6 [0.5131480693817139, 2.018434524536133] 7 [0.7008132934570312, 4.828225612640381] 8 [0.4844670295715332, 0.4277021586894989] 9 [0.4940509498119354, 1.6206215620040894] 10 
[0.6338182091712952, 2.206193208694458] 11 [0.4539909064769745, 2.320730209350586] 12 [0.8748450875282288, 5.564755439758301] 13 [0.9608470797538757, 3.0161831378936768] 14 [0.9357617497444153, 0.9921724796295166] 15 [0.87663334608078, -0.093462735414505] 0 [13.709152221679688, 22.809261322021484, 29.010334014892578] 1 [25.862089157104492, 24.111196517944336, 61.79491424560547] 2 [53.347251892089844, 19.135141372680664, 25.95013999938965] 3 [50.07076644897461, 24.900554656982422, 30.337209701538086] 4 [30.814517974853516, 23.135038375854492, 26.787220001220703] 5 [37.91080093383789, 22.318391799926758, 33.164920806884766] 6 [35.68564987182617, 25.35393714904785, 25.2377872467041] 7 [45.4833869934082, 0.0, 35.61249923706055] 8 [32.62076950073242, 25.41619873046875, 38.358787536621094] 9 [45.03955078125, 22.25871467590332, 31.687469482421875] 10 [59.82936477661133, 23.383920669555664, 31.22537612915039] 11 [49.20915222167969, 28.544231414794922, 19.206892013549805] 12 [69.35407257080078, 23.327739715576172, 20.0579891204834] 13 [88.60011291503906, 16.916179656982422, 23.175933837890625] 14 [96.40277099609375, 19.80704116821289, 30.91542625427246] 15 [100.18685150146484, 69.47402954101562, 112.73685455322266] step:5126/6710 train_time:1173776ms step_avg:228.98ms step:5127/6710 train_time:1174013ms step_avg:228.99ms step:5128/6710 train_time:1174256ms step_avg:228.99ms step:5129/6710 train_time:1174495ms step_avg:228.99ms step:5130/6710 train_time:1174736ms step_avg:228.99ms step:5131/6710 train_time:1174976ms step_avg:229.00ms step:5132/6710 train_time:1175216ms step_avg:229.00ms step:5133/6710 train_time:1175455ms step_avg:229.00ms step:5134/6710 train_time:1175693ms step_avg:229.00ms step:5135/6710 train_time:1175932ms step_avg:229.00ms step:5136/6710 train_time:1176171ms step_avg:229.01ms step:5137/6710 train_time:1176414ms step_avg:229.01ms step:5138/6710 train_time:1176655ms step_avg:229.01ms step:5139/6710 train_time:1176892ms step_avg:229.01ms step:5140/6710 
train_time:1177131ms step_avg:229.01ms step:5141/6710 train_time:1177371ms step_avg:229.02ms step:5142/6710 train_time:1177608ms step_avg:229.02ms step:5143/6710 train_time:1177851ms step_avg:229.02ms step:5144/6710 train_time:1178090ms step_avg:229.02ms step:5145/6710 train_time:1178327ms step_avg:229.02ms step:5146/6710 train_time:1178567ms step_avg:229.03ms step:5147/6710 train_time:1178807ms step_avg:229.03ms step:5148/6710 train_time:1179047ms step_avg:229.03ms step:5149/6710 train_time:1179286ms step_avg:229.03ms step:5150/6710 train_time:1179524ms step_avg:229.03ms step:5151/6710 train_time:1179761ms step_avg:229.04ms step:5152/6710 train_time:1179997ms step_avg:229.04ms step:5153/6710 train_time:1180236ms step_avg:229.04ms step:5154/6710 train_time:1180474ms step_avg:229.04ms step:5155/6710 train_time:1180716ms step_avg:229.04ms step:5156/6710 train_time:1180954ms step_avg:229.04ms step:5157/6710 train_time:1181194ms step_avg:229.05ms step:5158/6710 train_time:1181433ms step_avg:229.05ms step:5159/6710 train_time:1181676ms step_avg:229.05ms step:5160/6710 train_time:1181918ms step_avg:229.05ms step:5161/6710 train_time:1182156ms step_avg:229.06ms step:5162/6710 train_time:1182394ms step_avg:229.06ms step:5163/6710 train_time:1182632ms step_avg:229.06ms step:5164/6710 train_time:1182873ms step_avg:229.06ms step:5165/6710 train_time:1183111ms step_avg:229.06ms step:5166/6710 train_time:1183351ms step_avg:229.07ms step:5167/6710 train_time:1183590ms step_avg:229.07ms step:5168/6710 train_time:1183834ms step_avg:229.07ms step:5169/6710 train_time:1184073ms step_avg:229.07ms step:5170/6710 train_time:1184309ms step_avg:229.07ms step:5171/6710 train_time:1184548ms step_avg:229.08ms step:5172/6710 train_time:1184788ms step_avg:229.08ms step:5173/6710 train_time:1185027ms step_avg:229.08ms step:5174/6710 train_time:1185266ms step_avg:229.08ms step:5175/6710 train_time:1185506ms step_avg:229.08ms step:5176/6710 train_time:1185745ms step_avg:229.09ms step:5177/6710 
train_time:1185986ms step_avg:229.09ms step:5178/6710 train_time:1186222ms step_avg:229.09ms step:5179/6710 train_time:1186459ms step_avg:229.09ms step:5180/6710 train_time:1186701ms step_avg:229.09ms step:5181/6710 train_time:1186941ms step_avg:229.09ms step:5182/6710 train_time:1187177ms step_avg:229.10ms step:5183/6710 train_time:1187416ms step_avg:229.10ms step:5184/6710 train_time:1187657ms step_avg:229.10ms step:5185/6710 train_time:1187899ms step_avg:229.10ms step:5186/6710 train_time:1188135ms step_avg:229.10ms step:5187/6710 train_time:1188373ms step_avg:229.11ms step:5188/6710 train_time:1188613ms step_avg:229.11ms step:5189/6710 train_time:1188852ms step_avg:229.11ms step:5190/6710 train_time:1189089ms step_avg:229.11ms step:5191/6710 train_time:1189328ms step_avg:229.11ms step:5192/6710 train_time:1189570ms step_avg:229.12ms step:5193/6710 train_time:1189812ms step_avg:229.12ms step:5194/6710 train_time:1190049ms step_avg:229.12ms step:5195/6710 train_time:1190290ms step_avg:229.12ms step:5196/6710 train_time:1190526ms step_avg:229.12ms step:5197/6710 train_time:1190766ms step_avg:229.13ms step:5198/6710 train_time:1191009ms step_avg:229.13ms step:5199/6710 train_time:1191249ms step_avg:229.13ms step:5200/6710 train_time:1191489ms step_avg:229.13ms step:5201/6710 train_time:1191732ms step_avg:229.14ms step:5202/6710 train_time:1191974ms step_avg:229.14ms step:5203/6710 train_time:1192214ms step_avg:229.14ms step:5204/6710 train_time:1192450ms step_avg:229.14ms step:5205/6710 train_time:1192691ms step_avg:229.14ms step:5206/6710 train_time:1192932ms step_avg:229.15ms step:5207/6710 train_time:1193169ms step_avg:229.15ms step:5208/6710 train_time:1193409ms step_avg:229.15ms step:5209/6710 train_time:1193649ms step_avg:229.15ms step:5210/6710 train_time:1193888ms step_avg:229.15ms step:5211/6710 train_time:1194127ms step_avg:229.16ms step:5212/6710 train_time:1194364ms step_avg:229.16ms step:5213/6710 train_time:1194603ms step_avg:229.16ms step:5214/6710 
train_time:1194842ms step_avg:229.16ms step:5215/6710 train_time:1195083ms step_avg:229.16ms step:5216/6710 train_time:1195321ms step_avg:229.16ms step:5217/6710 train_time:1195557ms step_avg:229.17ms step:5218/6710 train_time:1195796ms step_avg:229.17ms step:5219/6710 train_time:1196036ms step_avg:229.17ms step:5220/6710 train_time:1196274ms step_avg:229.17ms step:5221/6710 train_time:1196513ms step_avg:229.17ms step:5222/6710 train_time:1196752ms step_avg:229.18ms step:5223/6710 train_time:1196990ms step_avg:229.18ms step:5224/6710 train_time:1197229ms step_avg:229.18ms step:5225/6710 train_time:1197465ms step_avg:229.18ms step:5226/6710 train_time:1197703ms step_avg:229.18ms step:5227/6710 train_time:1197940ms step_avg:229.18ms step:5228/6710 train_time:1198180ms step_avg:229.19ms step:5229/6710 train_time:1198417ms step_avg:229.19ms step:5230/6710 train_time:1198655ms step_avg:229.19ms step:5231/6710 train_time:1198893ms step_avg:229.19ms step:5232/6710 train_time:1199131ms step_avg:229.19ms step:5233/6710 train_time:1199368ms step_avg:229.19ms step:5234/6710 train_time:1199609ms step_avg:229.20ms step:5235/6710 train_time:1199848ms step_avg:229.20ms step:5236/6710 train_time:1200088ms step_avg:229.20ms step:5237/6710 train_time:1200324ms step_avg:229.20ms step:5238/6710 train_time:1200564ms step_avg:229.20ms step:5239/6710 train_time:1200799ms step_avg:229.20ms step:5240/6710 train_time:1201040ms step_avg:229.21ms step:5241/6710 train_time:1201279ms step_avg:229.21ms step:5242/6710 train_time:1201516ms step_avg:229.21ms step:5243/6710 train_time:1201756ms step_avg:229.21ms step:5244/6710 train_time:1201994ms step_avg:229.21ms step:5245/6710 train_time:1202236ms step_avg:229.22ms step:5246/6710 train_time:1202473ms step_avg:229.22ms step:5247/6710 train_time:1202714ms step_avg:229.22ms step:5248/6710 train_time:1202952ms step_avg:229.22ms step:5249/6710 train_time:1203191ms step_avg:229.22ms step:5250/6710 train_time:1203428ms step_avg:229.22ms step:5250/6710 
val_loss:2.996231 train_time:1203615ms step_avg:229.26ms Parameter containing: tensor([1.0000, 1.0000, 0.4089, 1.0000, 0.4972, 1.0000, 0.4031, 1.0000], device='cuda:0', requires_grad=True) 0 [7.300507545471191, 6.300505638122559] 1 [0.49460428953170776, 5.713593482971191] 2 [0.6470548510551453, 3.4514827728271484] 3 [0.6750762462615967, 2.9288909435272217] 4 [0.3999447822570801, 2.172232151031494] 5 [0.621207594871521, 2.9022672176361084] 6 [0.5179939270019531, 1.926757574081421] 7 [0.6914876699447632, 4.73323917388916] 8 [0.4849771559238434, 0.3566151261329651] 9 [0.4936077892780304, 1.5626877546310425] 10 [0.6268729567527771, 2.138237714767456] 11 [0.45652323961257935, 2.2561943531036377] 12 [0.8715552091598511, 5.4937872886657715] 13 [0.9528843760490417, 2.9747018814086914] 14 [0.9341464042663574, 0.9587427377700806] 15 [0.8833829164505005, -0.1436278373003006] 0 [13.603947639465332, 22.226505279541016, 28.820775985717773] 1 [25.748258590698242, 23.55054473876953, 59.977943420410156] 2 [51.80741882324219, 18.6899471282959, 25.36813735961914] 3 [48.362754821777344, 24.325668334960938, 29.753746032714844] 4 [30.377470016479492, 22.72675132751465, 26.643390655517578] 5 [37.23954772949219, 21.725521087646484, 32.510581970214844] 6 [35.25433349609375, 24.738874435424805, 24.980833053588867] 7 [44.14822006225586, 0.0, 34.92915344238281] 8 [31.850343704223633, 24.7325382232666, 37.66307067871094] 9 [43.95170593261719, 21.79441261291504, 31.18023681640625] 10 [57.77241516113281, 22.826366424560547, 30.737472534179688] 11 [48.062015533447266, 28.01258659362793, 19.02900505065918] 12 [67.66686248779297, 22.84257698059082, 19.928848266601562] 13 [85.96977233886719, 16.262136459350586, 22.646854400634766] 14 [93.47948455810547, 19.107315063476562, 30.260433197021484] 15 [97.96270751953125, 67.7748031616211, 110.67249298095703] step:5251/6710 train_time:1203666ms step_avg:229.23ms step:5252/6710 train_time:1203902ms step_avg:229.23ms step:5253/6710 train_time:1204144ms 
step_avg:229.23ms step:5254/6710 train_time:1204381ms step_avg:229.23ms step:5255/6710 train_time:1204623ms step_avg:229.23ms step:5256/6710 train_time:1204866ms step_avg:229.24ms step:5257/6710 train_time:1205105ms step_avg:229.24ms step:5258/6710 train_time:1205343ms step_avg:229.24ms step:5259/6710 train_time:1205581ms step_avg:229.24ms step:5260/6710 train_time:1205821ms step_avg:229.24ms step:5261/6710 train_time:1206060ms step_avg:229.25ms step:5262/6710 train_time:1206297ms step_avg:229.25ms step:5263/6710 train_time:1206535ms step_avg:229.25ms step:5264/6710 train_time:1206774ms step_avg:229.25ms step:5265/6710 train_time:1207012ms step_avg:229.25ms step:5266/6710 train_time:1207252ms step_avg:229.25ms step:5267/6710 train_time:1207488ms step_avg:229.26ms step:5268/6710 train_time:1207728ms step_avg:229.26ms step:5269/6710 train_time:1207967ms step_avg:229.26ms step:5270/6710 train_time:1208206ms step_avg:229.26ms step:5271/6710 train_time:1208444ms step_avg:229.26ms step:5272/6710 train_time:1208683ms step_avg:229.26ms step:5273/6710 train_time:1208923ms step_avg:229.27ms step:5274/6710 train_time:1209161ms step_avg:229.27ms step:5275/6710 train_time:1209402ms step_avg:229.27ms step:5276/6710 train_time:1209639ms step_avg:229.27ms step:5277/6710 train_time:1209878ms step_avg:229.27ms step:5278/6710 train_time:1210116ms step_avg:229.28ms step:5279/6710 train_time:1210356ms step_avg:229.28ms step:5280/6710 train_time:1210599ms step_avg:229.28ms step:5281/6710 train_time:1210836ms step_avg:229.28ms step:5282/6710 train_time:1211075ms step_avg:229.28ms step:5283/6710 train_time:1211315ms step_avg:229.29ms step:5284/6710 train_time:1211554ms step_avg:229.29ms step:5285/6710 train_time:1211791ms step_avg:229.29ms step:5286/6710 train_time:1212031ms step_avg:229.29ms step:5287/6710 train_time:1212270ms step_avg:229.29ms step:5288/6710 train_time:1212507ms step_avg:229.29ms step:5289/6710 train_time:1212744ms step_avg:229.30ms step:5290/6710 train_time:1212984ms 
step_avg:229.30ms step:5291/6710 train_time:1213224ms step_avg:229.30ms step:5292/6710 train_time:1213463ms step_avg:229.30ms step:5293/6710 train_time:1213704ms step_avg:229.30ms step:5294/6710 train_time:1213946ms step_avg:229.31ms step:5295/6710 train_time:1214184ms step_avg:229.31ms step:5296/6710 train_time:1214427ms step_avg:229.31ms step:5297/6710 train_time:1214667ms step_avg:229.31ms step:5298/6710 train_time:1214905ms step_avg:229.31ms step:5299/6710 train_time:1215144ms step_avg:229.32ms step:5300/6710 train_time:1215383ms step_avg:229.32ms step:5301/6710 train_time:1215623ms step_avg:229.32ms step:5302/6710 train_time:1215861ms step_avg:229.32ms step:5303/6710 train_time:1216099ms step_avg:229.32ms step:5304/6710 train_time:1216337ms step_avg:229.32ms step:5305/6710 train_time:1216578ms step_avg:229.33ms step:5306/6710 train_time:1216817ms step_avg:229.33ms step:5307/6710 train_time:1217055ms step_avg:229.33ms step:5308/6710 train_time:1217294ms step_avg:229.33ms step:5309/6710 train_time:1217532ms step_avg:229.33ms step:5310/6710 train_time:1217770ms step_avg:229.34ms step:5311/6710 train_time:1218008ms step_avg:229.34ms step:5312/6710 train_time:1218245ms step_avg:229.34ms step:5313/6710 train_time:1218492ms step_avg:229.34ms step:5314/6710 train_time:1218729ms step_avg:229.34ms step:5315/6710 train_time:1218968ms step_avg:229.34ms step:5316/6710 train_time:1219204ms step_avg:229.35ms step:5317/6710 train_time:1219443ms step_avg:229.35ms step:5318/6710 train_time:1219682ms step_avg:229.35ms step:5319/6710 train_time:1219919ms step_avg:229.35ms step:5320/6710 train_time:1220158ms step_avg:229.35ms step:5321/6710 train_time:1220397ms step_avg:229.35ms step:5322/6710 train_time:1220636ms step_avg:229.36ms step:5323/6710 train_time:1220875ms step_avg:229.36ms step:5324/6710 train_time:1221112ms step_avg:229.36ms step:5325/6710 train_time:1221350ms step_avg:229.36ms step:5326/6710 train_time:1221590ms step_avg:229.36ms step:5327/6710 train_time:1221828ms 
step_avg:229.37ms step:5328/6710 train_time:1222066ms step_avg:229.37ms step:5329/6710 train_time:1222306ms step_avg:229.37ms step:5330/6710 train_time:1222545ms step_avg:229.37ms step:5331/6710 train_time:1222788ms step_avg:229.37ms step:5332/6710 train_time:1223028ms step_avg:229.38ms step:5333/6710 train_time:1223266ms step_avg:229.38ms step:5334/6710 train_time:1223505ms step_avg:229.38ms step:5335/6710 train_time:1223744ms step_avg:229.38ms step:5336/6710 train_time:1223984ms step_avg:229.38ms step:5337/6710 train_time:1224222ms step_avg:229.38ms step:5338/6710 train_time:1224459ms step_avg:229.39ms step:5339/6710 train_time:1224699ms step_avg:229.39ms step:5340/6710 train_time:1224936ms step_avg:229.39ms step:5341/6710 train_time:1225175ms step_avg:229.39ms step:5342/6710 train_time:1225414ms step_avg:229.39ms step:5343/6710 train_time:1225651ms step_avg:229.39ms step:5344/6710 train_time:1225887ms step_avg:229.40ms step:5345/6710 train_time:1226126ms step_avg:229.40ms step:5346/6710 train_time:1226367ms step_avg:229.40ms step:5347/6710 train_time:1226605ms step_avg:229.40ms step:5348/6710 train_time:1226845ms step_avg:229.40ms step:5349/6710 train_time:1227084ms step_avg:229.40ms step:5350/6710 train_time:1227324ms step_avg:229.41ms step:5351/6710 train_time:1227566ms step_avg:229.41ms step:5352/6710 train_time:1227802ms step_avg:229.41ms step:5353/6710 train_time:1228039ms step_avg:229.41ms step:5354/6710 train_time:1228275ms step_avg:229.41ms step:5355/6710 train_time:1228518ms step_avg:229.42ms step:5356/6710 train_time:1228756ms step_avg:229.42ms step:5357/6710 train_time:1228993ms step_avg:229.42ms step:5358/6710 train_time:1229231ms step_avg:229.42ms step:5359/6710 train_time:1229469ms step_avg:229.42ms step:5360/6710 train_time:1229707ms step_avg:229.42ms step:5361/6710 train_time:1229945ms step_avg:229.42ms step:5362/6710 train_time:1230185ms step_avg:229.43ms step:5363/6710 train_time:1230425ms step_avg:229.43ms step:5364/6710 train_time:1230661ms 
step_avg:229.43ms step:5365/6710 train_time:1230901ms step_avg:229.43ms step:5366/6710 train_time:1231141ms step_avg:229.43ms step:5367/6710 train_time:1231381ms step_avg:229.44ms step:5368/6710 train_time:1231619ms step_avg:229.44ms step:5369/6710 train_time:1231859ms step_avg:229.44ms step:5370/6710 train_time:1232098ms step_avg:229.44ms step:5371/6710 train_time:1232340ms step_avg:229.44ms step:5372/6710 train_time:1232577ms step_avg:229.44ms step:5373/6710 train_time:1232815ms step_avg:229.45ms step:5374/6710 train_time:1233055ms step_avg:229.45ms step:5375/6710 train_time:1233295ms step_avg:229.45ms step:5375/6710 val_loss:2.989001 train_time:1233484ms step_avg:229.49ms Parameter containing: tensor([1.0000, 1.0000, 0.4086, 1.0000, 0.4929, 1.0000, 0.3953, 1.0000], device='cuda:0', requires_grad=True) 0 [7.230266571044922, 6.230264663696289] 1 [0.4900146722793579, 5.634909152984619] 2 [0.6320222616195679, 3.360023021697998] 3 [0.685654878616333, 2.8568482398986816] 4 [0.4003188908100128, 2.1185364723205566] 5 [0.6172142028808594, 2.8020434379577637] 6 [0.5135084390640259, 1.84274160861969] 7 [0.6846768260002136, 4.657920837402344] 8 [0.4826231598854065, 0.3053528666496277] 9 [0.4918438494205475, 1.5085391998291016] 10 [0.627539336681366, 2.0807015895843506] 11 [0.45833101868629456, 2.2054219245910645] 12 [0.8645062446594238, 5.416343688964844] 13 [0.9452071189880371, 2.9172327518463135] 14 [0.9312282800674438, 0.9073137640953064] 15 [0.8829900622367859, -0.1902437061071396] 0 [13.464994430541992, 21.808433532714844, 28.504478454589844] 1 [25.181533813476562, 23.139507293701172, 59.75601577758789] 2 [50.11479568481445, 18.209434509277344, 24.822227478027344] 3 [47.54084396362305, 23.67276954650879, 29.016605377197266] 4 [29.75804901123047, 22.122760772705078, 26.354393005371094] 5 [36.31441116333008, 21.262495040893555, 31.864057540893555] 6 [34.1589241027832, 24.221567153930664, 24.481657028198242] 7 [42.61552810668945, 0.0, 34.1134033203125] 8 
[30.742961883544922, 24.26961326599121, 36.811737060546875] 9 [42.43292236328125, 21.275182723999023, 30.390640258789062] 10 [56.09733963012695, 22.425247192382812, 29.792068481445312] 11 [46.84803771972656, 27.428348541259766, 18.799259185791016] 12 [65.68203735351562, 22.56757354736328, 19.60304832458496] 13 [83.1624755859375, 15.850160598754883, 22.016246795654297] 14 [90.23566436767578, 18.669830322265625, 29.52333641052246] 15 [94.76075744628906, 65.9389877319336, 106.6334228515625] step:5376/6710 train_time:1233535ms step_avg:229.45ms step:5377/6710 train_time:1233771ms step_avg:229.45ms step:5378/6710 train_time:1234015ms step_avg:229.46ms step:5379/6710 train_time:1234251ms step_avg:229.46ms step:5380/6710 train_time:1234488ms step_avg:229.46ms step:5381/6710 train_time:1234728ms step_avg:229.46ms step:5382/6710 train_time:1234969ms step_avg:229.46ms step:5383/6710 train_time:1235208ms step_avg:229.46ms step:5384/6710 train_time:1235444ms step_avg:229.47ms step:5385/6710 train_time:1235682ms step_avg:229.47ms step:5386/6710 train_time:1235923ms step_avg:229.47ms step:5387/6710 train_time:1236160ms step_avg:229.47ms step:5388/6710 train_time:1236399ms step_avg:229.47ms step:5389/6710 train_time:1236636ms step_avg:229.47ms step:5390/6710 train_time:1236875ms step_avg:229.48ms step:5391/6710 train_time:1237116ms step_avg:229.48ms step:5392/6710 train_time:1237353ms step_avg:229.48ms step:5393/6710 train_time:1237589ms step_avg:229.48ms step:5394/6710 train_time:1237827ms step_avg:229.48ms step:5395/6710 train_time:1238067ms step_avg:229.48ms step:5396/6710 train_time:1238305ms step_avg:229.49ms step:5397/6710 train_time:1238547ms step_avg:229.49ms step:5398/6710 train_time:1238785ms step_avg:229.49ms step:5399/6710 train_time:1239029ms step_avg:229.49ms step:5400/6710 train_time:1239267ms step_avg:229.49ms step:5401/6710 train_time:1239503ms step_avg:229.50ms step:5402/6710 train_time:1239741ms step_avg:229.50ms step:5403/6710 train_time:1239981ms 
step_avg:229.50ms step:5404/6710 train_time:1240222ms step_avg:229.50ms step:5405/6710 train_time:1240461ms step_avg:229.50ms step:5406/6710 train_time:1240698ms step_avg:229.50ms step:5407/6710 train_time:1240936ms step_avg:229.51ms step:5408/6710 train_time:1241175ms step_avg:229.51ms step:5409/6710 train_time:1241413ms step_avg:229.51ms step:5410/6710 train_time:1241649ms step_avg:229.51ms step:5411/6710 train_time:1241888ms step_avg:229.51ms step:5412/6710 train_time:1242127ms step_avg:229.51ms step:5413/6710 train_time:1242368ms step_avg:229.52ms step:5414/6710 train_time:1242606ms step_avg:229.52ms step:5415/6710 train_time:1242843ms step_avg:229.52ms step:5416/6710 train_time:1243084ms step_avg:229.52ms step:5417/6710 train_time:1243322ms step_avg:229.52ms step:5418/6710 train_time:1243560ms step_avg:229.52ms step:5419/6710 train_time:1243798ms step_avg:229.53ms step:5420/6710 train_time:1244037ms step_avg:229.53ms step:5421/6710 train_time:1244274ms step_avg:229.53ms step:5422/6710 train_time:1244512ms step_avg:229.53ms step:5423/6710 train_time:1244751ms step_avg:229.53ms step:5424/6710 train_time:1244993ms step_avg:229.53ms step:5425/6710 train_time:1245233ms step_avg:229.54ms step:5426/6710 train_time:1245472ms step_avg:229.54ms step:5427/6710 train_time:1245710ms step_avg:229.54ms step:5428/6710 train_time:1245947ms step_avg:229.54ms step:5429/6710 train_time:1246187ms step_avg:229.54ms step:5430/6710 train_time:1246423ms step_avg:229.54ms step:5431/6710 train_time:1246661ms step_avg:229.55ms step:5432/6710 train_time:1246900ms step_avg:229.55ms step:5433/6710 train_time:1247140ms step_avg:229.55ms step:5434/6710 train_time:1247380ms step_avg:229.55ms step:5435/6710 train_time:1247619ms step_avg:229.55ms step:5436/6710 train_time:1247858ms step_avg:229.55ms step:5437/6710 train_time:1248094ms step_avg:229.56ms step:5438/6710 train_time:1248337ms step_avg:229.56ms step:5439/6710 train_time:1248576ms step_avg:229.56ms step:5440/6710 train_time:1248813ms 
step_avg:229.56ms step:5441/6710 train_time:1249053ms step_avg:229.56ms step:5442/6710 train_time:1249292ms step_avg:229.56ms step:5443/6710 train_time:1249532ms step_avg:229.57ms step:5444/6710 train_time:1249771ms step_avg:229.57ms step:5445/6710 train_time:1250009ms step_avg:229.57ms step:5446/6710 train_time:1250248ms step_avg:229.57ms step:5447/6710 train_time:1250488ms step_avg:229.57ms step:5448/6710 train_time:1250726ms step_avg:229.58ms step:5449/6710 train_time:1250967ms step_avg:229.58ms step:5450/6710 train_time:1251205ms step_avg:229.58ms step:5451/6710 train_time:1251446ms step_avg:229.58ms step:5452/6710 train_time:1251685ms step_avg:229.58ms step:5453/6710 train_time:1251925ms step_avg:229.58ms step:5454/6710 train_time:1252164ms step_avg:229.59ms step:5455/6710 train_time:1252403ms step_avg:229.59ms step:5456/6710 train_time:1252641ms step_avg:229.59ms step:5457/6710 train_time:1252882ms step_avg:229.59ms step:5458/6710 train_time:1253118ms step_avg:229.59ms step:5459/6710 train_time:1253357ms step_avg:229.59ms step:5460/6710 train_time:1253596ms step_avg:229.60ms step:5461/6710 train_time:1253836ms step_avg:229.60ms step:5462/6710 train_time:1254076ms step_avg:229.60ms step:5463/6710 train_time:1254316ms step_avg:229.60ms step:5464/6710 train_time:1254556ms step_avg:229.60ms step:5465/6710 train_time:1254794ms step_avg:229.61ms step:5466/6710 train_time:1255031ms step_avg:229.61ms step:5467/6710 train_time:1255270ms step_avg:229.61ms step:5468/6710 train_time:1255507ms step_avg:229.61ms step:5469/6710 train_time:1255749ms step_avg:229.61ms step:5470/6710 train_time:1255988ms step_avg:229.61ms step:5471/6710 train_time:1256229ms step_avg:229.62ms step:5472/6710 train_time:1256469ms step_avg:229.62ms step:5473/6710 train_time:1256710ms step_avg:229.62ms step:5474/6710 train_time:1256949ms step_avg:229.62ms step:5475/6710 train_time:1257193ms step_avg:229.62ms step:5476/6710 train_time:1257434ms step_avg:229.63ms step:5477/6710 train_time:1257673ms 
step_avg:229.63ms step:5478/6710 train_time:1257913ms step_avg:229.63ms step:5479/6710 train_time:1258156ms step_avg:229.63ms step:5480/6710 train_time:1258398ms step_avg:229.63ms step:5481/6710 train_time:1258640ms step_avg:229.64ms step:5482/6710 train_time:1258882ms step_avg:229.64ms step:5483/6710 train_time:1259124ms step_avg:229.64ms step:5484/6710 train_time:1259367ms step_avg:229.64ms step:5485/6710 train_time:1259606ms step_avg:229.65ms step:5486/6710 train_time:1259848ms step_avg:229.65ms step:5487/6710 train_time:1260097ms step_avg:229.65ms step:5488/6710 train_time:1260338ms step_avg:229.65ms step:5489/6710 train_time:1260580ms step_avg:229.66ms step:5490/6710 train_time:1260819ms step_avg:229.66ms step:5491/6710 train_time:1261062ms step_avg:229.66ms step:5492/6710 train_time:1261303ms step_avg:229.66ms step:5493/6710 train_time:1261545ms step_avg:229.66ms step:5494/6710 train_time:1261785ms step_avg:229.67ms step:5495/6710 train_time:1262031ms step_avg:229.67ms step:5496/6710 train_time:1262270ms step_avg:229.67ms step:5497/6710 train_time:1262510ms step_avg:229.67ms step:5498/6710 train_time:1262752ms step_avg:229.67ms step:5499/6710 train_time:1262993ms step_avg:229.68ms step:5500/6710 train_time:1263236ms step_avg:229.68ms step:5500/6710 val_loss:2.980917 train_time:1263426ms step_avg:229.71ms Parameter containing: tensor([1.0000, 1.0000, 0.4078, 1.0000, 0.4850, 1.0000, 0.3914, 1.0000], device='cuda:0', requires_grad=True) 0 [7.15593147277832, 6.1559295654296875] 1 [0.48693907260894775, 5.5159149169921875] 2 [0.6274405121803284, 3.237460136413574] 3 [0.685496985912323, 2.760209321975708] 4 [0.40746182203292847, 2.0491254329681396] 5 [0.606309175491333, 2.6943166255950928] 6 [0.5185825228691101, 1.743574857711792] 7 [0.683735191822052, 4.543481826782227] 8 [0.4856742024421692, 0.20892085134983063] 9 [0.48823031783103943, 1.4268139600753784] 10 [0.6237151622772217, 2.0011422634124756] 11 [0.46099358797073364, 2.118128538131714] 12 
[0.8653669953346252, 5.313226699829102] 13 [0.9389949440956116, 2.8454389572143555] 14 [0.9278438091278076, 0.8532629013061523] 15 [0.8860764503479004, -0.2464248090982437] 0 [13.316262245178223, 21.4061279296875, 27.891847610473633] 1 [24.540075302124023, 22.538816452026367, 59.42407989501953] 2 [49.076904296875, 17.566513061523438, 23.985767364501953] 3 [46.272037506103516, 23.00115394592285, 28.25519561767578] 4 [29.410282135009766, 21.693939208984375, 25.648181915283203] 5 [34.96238327026367, 20.6544132232666, 31.205245971679688] 6 [33.42698669433594, 23.527496337890625, 23.961162567138672] 7 [41.445213317871094, 0.0, 33.31083297729492] 8 [30.09371566772461, 23.447546005249023, 36.26824188232422] 9 [41.056461334228516, 20.62626075744629, 29.61614227294922] 10 [53.90050506591797, 21.790302276611328, 29.35235023498535] 11 [45.62035369873047, 26.814027786254883, 18.533382415771484] 12 [64.11946105957031, 22.165283203125, 19.25044822692871] 13 [80.76848602294922, 15.529581069946289, 21.575368881225586] 14 [87.50179290771484, 18.206655502319336, 28.688142776489258] 15 [92.30421447753906, 64.11641693115234, 104.19085693359375] step:5501/6710 train_time:1263478ms step_avg:229.68ms step:5502/6710 train_time:1263719ms step_avg:229.68ms step:5503/6710 train_time:1263962ms step_avg:229.69ms step:5504/6710 train_time:1264204ms step_avg:229.69ms step:5505/6710 train_time:1264449ms step_avg:229.69ms step:5506/6710 train_time:1264690ms step_avg:229.69ms step:5507/6710 train_time:1264929ms step_avg:229.69ms step:5508/6710 train_time:1265172ms step_avg:229.70ms step:5509/6710 train_time:1265412ms step_avg:229.70ms step:5510/6710 train_time:1265655ms step_avg:229.70ms step:5511/6710 train_time:1265898ms step_avg:229.70ms step:5512/6710 train_time:1266138ms step_avg:229.71ms step:5513/6710 train_time:1266379ms step_avg:229.71ms step:5514/6710 train_time:1266623ms step_avg:229.71ms step:5515/6710 train_time:1266866ms step_avg:229.71ms step:5516/6710 train_time:1267107ms 
step_avg:229.71ms step:5517/6710 train_time:1267346ms step_avg:229.72ms step:5518/6710 train_time:1267588ms step_avg:229.72ms step:5519/6710 train_time:1267830ms step_avg:229.72ms step:5520/6710 train_time:1268072ms step_avg:229.72ms step:5521/6710 train_time:1268316ms step_avg:229.73ms step:5522/6710 train_time:1268562ms step_avg:229.73ms step:5523/6710 train_time:1268800ms step_avg:229.73ms step:5524/6710 train_time:1269042ms step_avg:229.73ms step:5525/6710 train_time:1269288ms step_avg:229.74ms step:5526/6710 train_time:1269531ms step_avg:229.74ms step:5527/6710 train_time:1269771ms step_avg:229.74ms step:5528/6710 train_time:1270014ms step_avg:229.74ms step:5529/6710 train_time:1270258ms step_avg:229.74ms step:5530/6710 train_time:1270504ms step_avg:229.75ms step:5531/6710 train_time:1270743ms step_avg:229.75ms step:5532/6710 train_time:1270982ms step_avg:229.75ms step:5533/6710 train_time:1271226ms step_avg:229.75ms step:5534/6710 train_time:1271467ms step_avg:229.76ms step:5535/6710 train_time:1271708ms step_avg:229.76ms step:5536/6710 train_time:1271947ms step_avg:229.76ms step:5537/6710 train_time:1272185ms step_avg:229.76ms step:5538/6710 train_time:1272426ms step_avg:229.76ms step:5539/6710 train_time:1272670ms step_avg:229.77ms step:5540/6710 train_time:1272912ms step_avg:229.77ms step:5541/6710 train_time:1273154ms step_avg:229.77ms step:5542/6710 train_time:1273397ms step_avg:229.77ms step:5543/6710 train_time:1273642ms step_avg:229.77ms step:5544/6710 train_time:1273883ms step_avg:229.78ms step:5545/6710 train_time:1274123ms step_avg:229.78ms step:5546/6710 train_time:1274365ms step_avg:229.78ms step:5547/6710 train_time:1274604ms step_avg:229.78ms step:5548/6710 train_time:1274848ms step_avg:229.79ms step:5549/6710 train_time:1275092ms step_avg:229.79ms step:5550/6710 train_time:1275333ms step_avg:229.79ms step:5551/6710 train_time:1275575ms step_avg:229.79ms step:5552/6710 train_time:1275820ms step_avg:229.79ms step:5553/6710 train_time:1276059ms 
step_avg:229.80ms step:5554/6710 train_time:1276298ms step_avg:229.80ms step:5555/6710 train_time:1276540ms step_avg:229.80ms step:5556/6710 train_time:1276779ms step_avg:229.80ms step:5557/6710 train_time:1277021ms step_avg:229.80ms step:5558/6710 train_time:1277264ms step_avg:229.81ms step:5559/6710 train_time:1277505ms step_avg:229.81ms step:5560/6710 train_time:1277745ms step_avg:229.81ms step:5561/6710 train_time:1277985ms step_avg:229.81ms step:5562/6710 train_time:1278226ms step_avg:229.81ms step:5563/6710 train_time:1278468ms step_avg:229.82ms step:5564/6710 train_time:1278711ms step_avg:229.82ms step:5565/6710 train_time:1278953ms step_avg:229.82ms step:5566/6710 train_time:1279200ms step_avg:229.82ms step:5567/6710 train_time:1279441ms step_avg:229.83ms step:5568/6710 train_time:1279682ms step_avg:229.83ms step:5569/6710 train_time:1279925ms step_avg:229.83ms step:5570/6710 train_time:1280167ms step_avg:229.83ms step:5571/6710 train_time:1280407ms step_avg:229.83ms step:5572/6710 train_time:1280649ms step_avg:229.84ms step:5573/6710 train_time:1280892ms step_avg:229.84ms step:5574/6710 train_time:1281139ms step_avg:229.84ms step:5575/6710 train_time:1281378ms step_avg:229.84ms step:5576/6710 train_time:1281618ms step_avg:229.85ms step:5577/6710 train_time:1281858ms step_avg:229.85ms step:5578/6710 train_time:1282101ms step_avg:229.85ms step:5579/6710 train_time:1282340ms step_avg:229.85ms step:5580/6710 train_time:1282582ms step_avg:229.85ms step:5581/6710 train_time:1282824ms step_avg:229.86ms step:5582/6710 train_time:1283065ms step_avg:229.86ms step:5583/6710 train_time:1283305ms step_avg:229.86ms step:5584/6710 train_time:1283545ms step_avg:229.86ms step:5585/6710 train_time:1283787ms step_avg:229.86ms step:5586/6710 train_time:1284028ms step_avg:229.87ms step:5587/6710 train_time:1284270ms step_avg:229.87ms step:5588/6710 train_time:1284509ms step_avg:229.87ms step:5589/6710 train_time:1284753ms step_avg:229.87ms step:5590/6710 train_time:1284992ms 
step_avg:229.87ms step:5591/6710 train_time:1285232ms step_avg:229.88ms step:5592/6710 train_time:1285475ms step_avg:229.88ms step:5593/6710 train_time:1285715ms step_avg:229.88ms step:5594/6710 train_time:1285957ms step_avg:229.88ms step:5595/6710 train_time:1286196ms step_avg:229.88ms step:5596/6710 train_time:1286440ms step_avg:229.89ms step:5597/6710 train_time:1286682ms step_avg:229.89ms step:5598/6710 train_time:1286923ms step_avg:229.89ms step:5599/6710 train_time:1287165ms step_avg:229.89ms step:5600/6710 train_time:1287407ms step_avg:229.89ms step:5601/6710 train_time:1287646ms step_avg:229.90ms step:5602/6710 train_time:1287890ms step_avg:229.90ms step:5603/6710 train_time:1288128ms step_avg:229.90ms step:5604/6710 train_time:1288371ms step_avg:229.90ms step:5605/6710 train_time:1288612ms step_avg:229.90ms step:5606/6710 train_time:1288858ms step_avg:229.91ms step:5607/6710 train_time:1289099ms step_avg:229.91ms step:5608/6710 train_time:1289341ms step_avg:229.91ms step:5609/6710 train_time:1289582ms step_avg:229.91ms step:5610/6710 train_time:1289825ms step_avg:229.92ms step:5611/6710 train_time:1290066ms step_avg:229.92ms step:5612/6710 train_time:1290308ms step_avg:229.92ms step:5613/6710 train_time:1290549ms step_avg:229.92ms step:5614/6710 train_time:1290792ms step_avg:229.92ms step:5615/6710 train_time:1291032ms step_avg:229.93ms step:5616/6710 train_time:1291278ms step_avg:229.93ms step:5617/6710 train_time:1291523ms step_avg:229.93ms step:5618/6710 train_time:1291761ms step_avg:229.93ms step:5619/6710 train_time:1292014ms step_avg:229.94ms step:5620/6710 train_time:1292253ms step_avg:229.94ms step:5621/6710 train_time:1292492ms step_avg:229.94ms step:5622/6710 train_time:1292733ms step_avg:229.94ms step:5623/6710 train_time:1292977ms step_avg:229.94ms step:5624/6710 train_time:1293219ms step_avg:229.95ms step:5625/6710 train_time:1293458ms step_avg:229.95ms step:5625/6710 val_loss:2.973513 train_time:1293648ms step_avg:229.98ms Parameter 
containing: tensor([1.0000, 1.0000, 0.4081, 1.0000, 0.4804, 1.0000, 0.3901, 1.0000], device='cuda:0', requires_grad=True) 0 [7.100879192352295, 6.100877285003662] 1 [0.48626959323883057, 5.410068035125732] 2 [0.6248505115509033, 3.1374716758728027] 3 [0.678866446018219, 2.669301986694336] 4 [0.4088243544101715, 2.0027549266815186] 5 [0.6031954288482666, 2.6001663208007812] 6 [0.5231689214706421, 1.6805706024169922] 7 [0.6813527345657349, 4.460036277770996] 8 [0.4906112849712372, 0.13500770926475525] 9 [0.4921431243419647, 1.3815689086914062] 10 [0.625578761100769, 1.9405057430267334] 11 [0.45821788907051086, 2.0627224445343018] 12 [0.8645539879798889, 5.220833778381348] 13 [0.9335287809371948, 2.7805137634277344] 14 [0.9256278276443481, 0.8025783896446228] 15 [0.8889406323432922, -0.3024553954601288] 0 [13.205183982849121, 20.875112533569336, 27.819259643554688] 1 [24.202747344970703, 22.048078536987305, 58.46070861816406] 2 [48.06254577636719, 17.21537208557129, 23.57957649230957] 3 [44.90956497192383, 22.48682403564453, 27.481182098388672] 4 [28.68776512145996, 21.23604393005371, 25.253002166748047] 5 [34.01756286621094, 20.138198852539062, 30.6137752532959] 6 [32.875911712646484, 23.02898406982422, 23.711097717285156] 7 [40.63523483276367, 0.0, 32.27657699584961] 8 [29.63728904724121, 22.91582489013672, 35.557533264160156] 9 [40.555625915527344, 20.113981246948242, 29.34349250793457] 10 [53.048274993896484, 21.367162704467773, 28.86475944519043] 11 [44.531063079833984, 26.13309669494629, 18.340167999267578] 12 [62.57772445678711, 21.691604614257812, 19.03702163696289] 13 [78.41228485107422, 15.125577926635742, 21.18573760986328] 14 [84.81041717529297, 17.76308822631836, 28.29610252380371] 15 [89.93726348876953, 62.15947723388672, 100.38521575927734] step:5626/6710 train_time:1293700ms step_avg:229.95ms step:5627/6710 train_time:1293939ms step_avg:229.95ms step:5628/6710 train_time:1294186ms step_avg:229.95ms step:5629/6710 train_time:1294428ms step_avg:229.96ms 
step:5630/6710 train_time:1294670ms step_avg:229.96ms step:5631/6710 train_time:1294909ms step_avg:229.96ms step:5632/6710 train_time:1295152ms step_avg:229.96ms step:5633/6710 train_time:1295391ms step_avg:229.96ms step:5634/6710 train_time:1295632ms step_avg:229.97ms step:5635/6710 train_time:1295876ms step_avg:229.97ms step:5636/6710 train_time:1296115ms step_avg:229.97ms step:5637/6710 train_time:1296357ms step_avg:229.97ms step:5638/6710 train_time:1296595ms step_avg:229.97ms step:5639/6710 train_time:1296841ms step_avg:229.98ms step:5640/6710 train_time:1297083ms step_avg:229.98ms step:5641/6710 train_time:1297326ms step_avg:229.98ms step:5642/6710 train_time:1297567ms step_avg:229.98ms step:5643/6710 train_time:1297810ms step_avg:229.99ms step:5644/6710 train_time:1298051ms step_avg:229.99ms step:5645/6710 train_time:1298290ms step_avg:229.99ms step:5646/6710 train_time:1298529ms step_avg:229.99ms step:5647/6710 train_time:1298771ms step_avg:229.99ms step:5648/6710 train_time:1299010ms step_avg:229.99ms step:5649/6710 train_time:1299249ms step_avg:230.00ms step:5650/6710 train_time:1299490ms step_avg:230.00ms step:5651/6710 train_time:1299733ms step_avg:230.00ms step:5652/6710 train_time:1299975ms step_avg:230.00ms step:5653/6710 train_time:1300216ms step_avg:230.00ms step:5654/6710 train_time:1300461ms step_avg:230.01ms step:5655/6710 train_time:1300700ms step_avg:230.01ms step:5656/6710 train_time:1300942ms step_avg:230.01ms step:5657/6710 train_time:1301185ms step_avg:230.01ms step:5658/6710 train_time:1301434ms step_avg:230.02ms step:5659/6710 train_time:1301684ms step_avg:230.02ms step:5660/6710 train_time:1301925ms step_avg:230.02ms step:5661/6710 train_time:1302166ms step_avg:230.02ms step:5662/6710 train_time:1302410ms step_avg:230.03ms step:5663/6710 train_time:1302651ms step_avg:230.03ms step:5664/6710 train_time:1302892ms step_avg:230.03ms step:5665/6710 train_time:1303134ms step_avg:230.03ms step:5666/6710 train_time:1303378ms step_avg:230.03ms 
step:5667/6710 train_time:1303619ms step_avg:230.04ms step:5668/6710 train_time:1303862ms step_avg:230.04ms step:5669/6710 train_time:1304102ms step_avg:230.04ms step:5670/6710 train_time:1304343ms step_avg:230.04ms step:5671/6710 train_time:1304585ms step_avg:230.05ms step:5672/6710 train_time:1304832ms step_avg:230.05ms step:5673/6710 train_time:1305073ms step_avg:230.05ms step:5674/6710 train_time:1305319ms step_avg:230.05ms step:5675/6710 train_time:1305557ms step_avg:230.05ms step:5676/6710 train_time:1305799ms step_avg:230.06ms step:5677/6710 train_time:1306041ms step_avg:230.06ms step:5678/6710 train_time:1306281ms step_avg:230.06ms step:5679/6710 train_time:1306523ms step_avg:230.06ms step:5680/6710 train_time:1306766ms step_avg:230.06ms step:5681/6710 train_time:1307009ms step_avg:230.07ms step:5682/6710 train_time:1307251ms step_avg:230.07ms step:5683/6710 train_time:1307492ms step_avg:230.07ms step:5684/6710 train_time:1307732ms step_avg:230.07ms step:5685/6710 train_time:1307971ms step_avg:230.07ms step:5686/6710 train_time:1308211ms step_avg:230.08ms step:5687/6710 train_time:1308455ms step_avg:230.08ms step:5688/6710 train_time:1308693ms step_avg:230.08ms step:5689/6710 train_time:1308932ms step_avg:230.08ms step:5690/6710 train_time:1309173ms step_avg:230.08ms step:5691/6710 train_time:1309412ms step_avg:230.08ms step:5692/6710 train_time:1309655ms step_avg:230.09ms step:5693/6710 train_time:1309895ms step_avg:230.09ms step:5694/6710 train_time:1310137ms step_avg:230.09ms step:5695/6710 train_time:1310378ms step_avg:230.09ms step:5696/6710 train_time:1310618ms step_avg:230.09ms step:5697/6710 train_time:1310859ms step_avg:230.10ms step:5698/6710 train_time:1311098ms step_avg:230.10ms step:5699/6710 train_time:1311338ms step_avg:230.10ms step:5700/6710 train_time:1311580ms step_avg:230.10ms step:5701/6710 train_time:1311820ms step_avg:230.10ms step:5702/6710 train_time:1312064ms step_avg:230.11ms step:5703/6710 train_time:1312310ms step_avg:230.11ms 
step:5704/6710 train_time:1312551ms step_avg:230.11ms step:5705/6710 train_time:1312790ms step_avg:230.11ms step:5706/6710 train_time:1313031ms step_avg:230.11ms step:5707/6710 train_time:1313272ms step_avg:230.12ms step:5708/6710 train_time:1313515ms step_avg:230.12ms step:5709/6710 train_time:1313756ms step_avg:230.12ms step:5710/6710 train_time:1313997ms step_avg:230.12ms step:5711/6710 train_time:1314243ms step_avg:230.12ms step:5712/6710 train_time:1314484ms step_avg:230.13ms step:5713/6710 train_time:1314728ms step_avg:230.13ms step:5714/6710 train_time:1314971ms step_avg:230.13ms step:5715/6710 train_time:1315213ms step_avg:230.13ms step:5716/6710 train_time:1315454ms step_avg:230.14ms step:5717/6710 train_time:1315698ms step_avg:230.14ms step:5718/6710 train_time:1315939ms step_avg:230.14ms step:5719/6710 train_time:1316181ms step_avg:230.14ms step:5720/6710 train_time:1316424ms step_avg:230.14ms step:5721/6710 train_time:1316668ms step_avg:230.15ms step:5722/6710 train_time:1316911ms step_avg:230.15ms step:5723/6710 train_time:1317152ms step_avg:230.15ms step:5724/6710 train_time:1317395ms step_avg:230.15ms step:5725/6710 train_time:1317643ms step_avg:230.16ms step:5726/6710 train_time:1317886ms step_avg:230.16ms step:5727/6710 train_time:1318126ms step_avg:230.16ms step:5728/6710 train_time:1318368ms step_avg:230.16ms step:5729/6710 train_time:1318607ms step_avg:230.16ms step:5730/6710 train_time:1318849ms step_avg:230.17ms step:5731/6710 train_time:1319089ms step_avg:230.17ms step:5732/6710 train_time:1319333ms step_avg:230.17ms step:5733/6710 train_time:1319574ms step_avg:230.17ms step:5734/6710 train_time:1319814ms step_avg:230.17ms step:5735/6710 train_time:1320056ms step_avg:230.18ms step:5736/6710 train_time:1320294ms step_avg:230.18ms step:5737/6710 train_time:1320536ms step_avg:230.18ms step:5738/6710 train_time:1320776ms step_avg:230.18ms step:5739/6710 train_time:1321015ms step_avg:230.18ms step:5740/6710 train_time:1321258ms step_avg:230.18ms 
step:5741/6710 train_time:1321499ms step_avg:230.19ms step:5742/6710 train_time:1321741ms step_avg:230.19ms step:5743/6710 train_time:1321982ms step_avg:230.19ms step:5744/6710 train_time:1322223ms step_avg:230.19ms step:5745/6710 train_time:1322462ms step_avg:230.19ms step:5746/6710 train_time:1322705ms step_avg:230.20ms step:5747/6710 train_time:1322945ms step_avg:230.20ms step:5748/6710 train_time:1323188ms step_avg:230.20ms step:5749/6710 train_time:1323432ms step_avg:230.20ms step:5750/6710 train_time:1323676ms step_avg:230.20ms step:5750/6710 val_loss:2.965373 train_time:1323865ms step_avg:230.24ms Parameter containing: tensor([1.0000, 1.0000, 0.4051, 1.0000, 0.4827, 1.0000, 0.3810, 1.0000], device='cuda:0', requires_grad=True) 0 [7.0314741134643555, 6.031472206115723] 1 [0.48267191648483276, 5.300169467926025] 2 [0.6165692806243896, 3.0301899909973145] 3 [0.6792068481445312, 2.580364942550659] 4 [0.40931060910224915, 1.9483461380004883] 5 [0.6027792096138, 2.500783920288086] 6 [0.515747606754303, 1.5968482494354248] 7 [0.6750012636184692, 4.374632358551025] 8 [0.4895232319831848, 0.09359093755483627] 9 [0.4884185194969177, 1.3397151231765747] 10 [0.6211040019989014, 1.8917174339294434] 11 [0.45962825417518616, 1.9873944520950317] 12 [0.8563240766525269, 5.132733345031738] 13 [0.9307145476341248, 2.7277536392211914] 14 [0.9218222498893738, 0.7549976110458374] 15 [0.8877795338630676, -0.3526320457458496] 0 [13.067646980285645, 20.46051788330078, 27.353364944458008] 1 [23.628887176513672, 21.541057586669922, 57.433746337890625] 2 [46.476844787597656, 16.78570556640625, 23.050678253173828] 3 [43.53470993041992, 21.944345474243164, 27.22372817993164] 4 [28.00074577331543, 20.69801139831543, 24.96300506591797] 5 [33.25343704223633, 19.727506637573242, 30.091524124145508] 6 [31.753692626953125, 22.513587951660156, 23.208242416381836] 7 [39.12025833129883, 0.0, 31.545732498168945] 8 [28.64665985107422, 22.382680892944336, 34.587379455566406] 9 [38.874271392822266, 
19.619098663330078, 28.489391326904297] 10 [50.99182891845703, 20.91455078125, 28.320486068725586] 11 [43.184078216552734, 25.66851806640625, 18.101776123046875] 12 [60.50731658935547, 21.389753341674805, 18.697349548339844] 13 [76.02520751953125, 14.712955474853516, 20.706409454345703] 14 [82.07556915283203, 17.0531005859375, 27.21541976928711] 15 [86.89371490478516, 60.64592742919922, 97.0982666015625] step:5751/6710 train_time:1323917ms step_avg:230.21ms step:5752/6710 train_time:1324155ms step_avg:230.21ms step:5753/6710 train_time:1324397ms step_avg:230.21ms step:5754/6710 train_time:1324636ms step_avg:230.21ms step:5755/6710 train_time:1324880ms step_avg:230.21ms step:5756/6710 train_time:1325124ms step_avg:230.22ms step:5757/6710 train_time:1325370ms step_avg:230.22ms step:5758/6710 train_time:1325610ms step_avg:230.22ms step:5759/6710 train_time:1325849ms step_avg:230.22ms step:5760/6710 train_time:1326094ms step_avg:230.22ms step:5761/6710 train_time:1326339ms step_avg:230.23ms step:5762/6710 train_time:1326580ms step_avg:230.23ms step:5763/6710 train_time:1326823ms step_avg:230.23ms step:5764/6710 train_time:1327064ms step_avg:230.23ms step:5765/6710 train_time:1327304ms step_avg:230.23ms step:5766/6710 train_time:1327548ms step_avg:230.24ms step:5767/6710 train_time:1327786ms step_avg:230.24ms step:5768/6710 train_time:1328026ms step_avg:230.24ms step:5769/6710 train_time:1328270ms step_avg:230.24ms step:5770/6710 train_time:1328511ms step_avg:230.24ms step:5771/6710 train_time:1328751ms step_avg:230.25ms step:5772/6710 train_time:1328990ms step_avg:230.25ms step:5773/6710 train_time:1329234ms step_avg:230.25ms step:5774/6710 train_time:1329474ms step_avg:230.25ms step:5775/6710 train_time:1329714ms step_avg:230.25ms step:5776/6710 train_time:1329954ms step_avg:230.26ms step:5777/6710 train_time:1330195ms step_avg:230.26ms step:5778/6710 train_time:1330437ms step_avg:230.26ms step:5779/6710 train_time:1330681ms step_avg:230.26ms step:5780/6710 
train_time:1330924ms step_avg:230.26ms step:5781/6710 train_time:1331165ms step_avg:230.27ms step:5782/6710 train_time:1331404ms step_avg:230.27ms step:5783/6710 train_time:1331645ms step_avg:230.27ms step:5784/6710 train_time:1331888ms step_avg:230.27ms step:5785/6710 train_time:1332129ms step_avg:230.27ms step:5786/6710 train_time:1332367ms step_avg:230.27ms step:5787/6710 train_time:1332608ms step_avg:230.28ms step:5788/6710 train_time:1332852ms step_avg:230.28ms step:5789/6710 train_time:1333089ms step_avg:230.28ms step:5790/6710 train_time:1333330ms step_avg:230.28ms step:5791/6710 train_time:1333572ms step_avg:230.28ms step:5792/6710 train_time:1333813ms step_avg:230.29ms step:5793/6710 train_time:1334052ms step_avg:230.29ms step:5794/6710 train_time:1334293ms step_avg:230.29ms step:5795/6710 train_time:1334534ms step_avg:230.29ms step:5796/6710 train_time:1334779ms step_avg:230.29ms step:5797/6710 train_time:1335019ms step_avg:230.29ms step:5798/6710 train_time:1335267ms step_avg:230.30ms step:5799/6710 train_time:1335508ms step_avg:230.30ms step:5800/6710 train_time:1335747ms step_avg:230.30ms step:5801/6710 train_time:1335987ms step_avg:230.30ms step:5802/6710 train_time:1336226ms step_avg:230.30ms step:5803/6710 train_time:1336467ms step_avg:230.31ms step:5804/6710 train_time:1336706ms step_avg:230.31ms step:5805/6710 train_time:1336945ms step_avg:230.31ms step:5806/6710 train_time:1337191ms step_avg:230.31ms step:5807/6710 train_time:1337430ms step_avg:230.31ms step:5808/6710 train_time:1337670ms step_avg:230.32ms step:5809/6710 train_time:1337912ms step_avg:230.32ms step:5810/6710 train_time:1338159ms step_avg:230.32ms step:5811/6710 train_time:1338398ms step_avg:230.32ms step:5812/6710 train_time:1338640ms step_avg:230.32ms step:5813/6710 train_time:1338879ms step_avg:230.33ms step:5814/6710 train_time:1339122ms step_avg:230.33ms step:5815/6710 train_time:1339366ms step_avg:230.33ms step:5816/6710 train_time:1339610ms step_avg:230.33ms step:5817/6710 
train_time:1339849ms step_avg:230.33ms step:5818/6710 train_time:1340087ms step_avg:230.33ms step:5819/6710 train_time:1340334ms step_avg:230.34ms step:5820/6710 train_time:1340575ms step_avg:230.34ms step:5821/6710 train_time:1340815ms step_avg:230.34ms step:5822/6710 train_time:1341057ms step_avg:230.34ms step:5823/6710 train_time:1341303ms step_avg:230.35ms step:5824/6710 train_time:1341543ms step_avg:230.35ms step:5825/6710 train_time:1341783ms step_avg:230.35ms step:5826/6710 train_time:1342023ms step_avg:230.35ms step:5827/6710 train_time:1342264ms step_avg:230.35ms step:5828/6710 train_time:1342505ms step_avg:230.35ms step:5829/6710 train_time:1342747ms step_avg:230.36ms step:5830/6710 train_time:1342986ms step_avg:230.36ms step:5831/6710 train_time:1343227ms step_avg:230.36ms step:5832/6710 train_time:1343466ms step_avg:230.36ms step:5833/6710 train_time:1343712ms step_avg:230.36ms step:5834/6710 train_time:1343957ms step_avg:230.37ms step:5835/6710 train_time:1344194ms step_avg:230.37ms step:5836/6710 train_time:1344436ms step_avg:230.37ms step:5837/6710 train_time:1344678ms step_avg:230.37ms step:5838/6710 train_time:1344917ms step_avg:230.37ms step:5839/6710 train_time:1345157ms step_avg:230.37ms step:5840/6710 train_time:1345399ms step_avg:230.38ms step:5841/6710 train_time:1345641ms step_avg:230.38ms step:5842/6710 train_time:1345883ms step_avg:230.38ms step:5843/6710 train_time:1346126ms step_avg:230.38ms step:5844/6710 train_time:1346368ms step_avg:230.38ms step:5845/6710 train_time:1346608ms step_avg:230.39ms step:5846/6710 train_time:1346852ms step_avg:230.39ms step:5847/6710 train_time:1347094ms step_avg:230.39ms step:5848/6710 train_time:1347342ms step_avg:230.39ms step:5849/6710 train_time:1347581ms step_avg:230.40ms step:5850/6710 train_time:1347823ms step_avg:230.40ms step:5851/6710 train_time:1348070ms step_avg:230.40ms step:5852/6710 train_time:1348311ms step_avg:230.40ms step:5853/6710 train_time:1348552ms step_avg:230.40ms step:5854/6710 
train_time:1348792ms step_avg:230.41ms step:5855/6710 train_time:1349032ms step_avg:230.41ms step:5856/6710 train_time:1349274ms step_avg:230.41ms step:5857/6710 train_time:1349516ms step_avg:230.41ms step:5858/6710 train_time:1349757ms step_avg:230.41ms step:5859/6710 train_time:1350002ms step_avg:230.42ms step:5860/6710 train_time:1350244ms step_avg:230.42ms step:5861/6710 train_time:1350492ms step_avg:230.42ms step:5862/6710 train_time:1350730ms step_avg:230.42ms step:5863/6710 train_time:1350971ms step_avg:230.42ms step:5864/6710 train_time:1351214ms step_avg:230.43ms step:5865/6710 train_time:1351457ms step_avg:230.43ms step:5866/6710 train_time:1351697ms step_avg:230.43ms step:5867/6710 train_time:1351938ms step_avg:230.43ms step:5868/6710 train_time:1352181ms step_avg:230.43ms step:5869/6710 train_time:1352421ms step_avg:230.43ms step:5870/6710 train_time:1352666ms step_avg:230.44ms step:5871/6710 train_time:1352908ms step_avg:230.44ms step:5872/6710 train_time:1353153ms step_avg:230.44ms step:5873/6710 train_time:1353394ms step_avg:230.44ms step:5874/6710 train_time:1353636ms step_avg:230.45ms step:5875/6710 train_time:1353876ms step_avg:230.45ms step:5875/6710 val_loss:2.958442 train_time:1354067ms step_avg:230.48ms Parameter containing: tensor([1.0000, 1.0000, 0.4040, 1.0000, 0.4736, 1.0000, 0.3771, 1.0000], device='cuda:0', requires_grad=True) 0 [6.959709167480469, 5.959707260131836] 1 [0.48238223791122437, 5.208357810974121] 2 [0.6102612018585205, 2.9437639713287354] 3 [0.6808334589004517, 2.5144522190093994] 4 [0.40963315963745117, 1.8828250169754028] 5 [0.595615029335022, 2.4135031700134277] 6 [0.520124614238739, 1.5405956506729126] 7 [0.6745418906211853, 4.294164657592773] 8 [0.49056828022003174, 0.039011068642139435] 9 [0.49050137400627136, 1.291703462600708] 10 [0.620217502117157, 1.8473800420761108] 11 [0.46329376101493835, 1.9282519817352295] 12 [0.8529780507087708, 5.051567554473877] 13 [0.9229364991188049, 2.6915671825408936] 14 
[0.9226366281509399, 0.7306663990020752] 15 [0.8921334147453308, -0.3797159492969513] 0 [12.92402172088623, 20.02634620666504, 26.86727523803711] 1 [23.1839599609375, 21.113710403442383, 56.90998840332031] 2 [45.3594856262207, 16.35187339782715, 22.84426498413086] 3 [42.677059173583984, 21.428390502929688, 26.737281799316406] 4 [27.47391128540039, 20.312639236450195, 24.698148727416992] 5 [32.311256408691406, 19.323089599609375, 29.436975479125977] 6 [31.17278289794922, 22.001893997192383, 22.867656707763672] 7 [38.291954040527344, 0.0, 30.925762176513672] 8 [28.094627380371094, 21.859432220458984, 34.15853500366211] 9 [38.20671081542969, 19.273923873901367, 28.278762817382812] 10 [49.91441345214844, 20.474376678466797, 28.016395568847656] 11 [42.64276123046875, 25.17499542236328, 17.910877227783203] 12 [59.39912414550781, 20.98900032043457, 18.5151309967041] 13 [74.03594970703125, 14.37484359741211, 20.356212615966797] 14 [80.10809326171875, 16.635215759277344, 26.813295364379883] 15 [85.33990478515625, 59.376251220703125, 95.29851531982422] step:5876/6710 train_time:1354120ms step_avg:230.45ms step:5877/6710 train_time:1354361ms step_avg:230.45ms step:5878/6710 train_time:1354606ms step_avg:230.45ms step:5879/6710 train_time:1354847ms step_avg:230.46ms step:5880/6710 train_time:1355090ms step_avg:230.46ms step:5881/6710 train_time:1355331ms step_avg:230.46ms step:5882/6710 train_time:1355580ms step_avg:230.46ms step:5883/6710 train_time:1355816ms step_avg:230.46ms step:5884/6710 train_time:1356059ms step_avg:230.47ms step:5885/6710 train_time:1356299ms step_avg:230.47ms step:5886/6710 train_time:1356542ms step_avg:230.47ms step:5887/6710 train_time:1356785ms step_avg:230.47ms step:5888/6710 train_time:1357024ms step_avg:230.47ms step:5889/6710 train_time:1357265ms step_avg:230.47ms step:5890/6710 train_time:1357508ms step_avg:230.48ms step:5891/6710 train_time:1357753ms step_avg:230.48ms step:5892/6710 train_time:1357993ms step_avg:230.48ms step:5893/6710 
train_time:1358232ms step_avg:230.48ms step:5894/6710 train_time:1358472ms step_avg:230.48ms step:5895/6710 train_time:1358715ms step_avg:230.49ms step:5896/6710 train_time:1358958ms step_avg:230.49ms step:5897/6710 train_time:1359199ms step_avg:230.49ms step:5898/6710 train_time:1359438ms step_avg:230.49ms step:5899/6710 train_time:1359681ms step_avg:230.49ms step:5900/6710 train_time:1359922ms step_avg:230.50ms step:5901/6710 train_time:1360159ms step_avg:230.50ms step:5902/6710 train_time:1360401ms step_avg:230.50ms step:5903/6710 train_time:1360641ms step_avg:230.50ms step:5904/6710 train_time:1360882ms step_avg:230.50ms step:5905/6710 train_time:1361122ms step_avg:230.50ms step:5906/6710 train_time:1361362ms step_avg:230.50ms step:5907/6710 train_time:1361601ms step_avg:230.51ms step:5908/6710 train_time:1361844ms step_avg:230.51ms step:5909/6710 train_time:1362086ms step_avg:230.51ms step:5910/6710 train_time:1362325ms step_avg:230.51ms step:5911/6710 train_time:1362568ms step_avg:230.51ms step:5912/6710 train_time:1362808ms step_avg:230.52ms step:5913/6710 train_time:1363047ms step_avg:230.52ms step:5914/6710 train_time:1363300ms step_avg:230.52ms step:5915/6710 train_time:1363541ms step_avg:230.52ms step:5916/6710 train_time:1363781ms step_avg:230.52ms step:5917/6710 train_time:1364022ms step_avg:230.53ms step:5918/6710 train_time:1364262ms step_avg:230.53ms step:5919/6710 train_time:1364501ms step_avg:230.53ms step:5920/6710 train_time:1364743ms step_avg:230.53ms step:5921/6710 train_time:1364982ms step_avg:230.53ms step:5922/6710 train_time:1365227ms step_avg:230.53ms step:5923/6710 train_time:1365467ms step_avg:230.54ms step:5924/6710 train_time:1365709ms step_avg:230.54ms step:5925/6710 train_time:1365951ms step_avg:230.54ms step:5926/6710 train_time:1366191ms step_avg:230.54ms step:5927/6710 train_time:1366433ms step_avg:230.54ms step:5928/6710 train_time:1366680ms step_avg:230.55ms step:5929/6710 train_time:1366923ms step_avg:230.55ms step:5930/6710 
train_time:1367164ms step_avg:230.55ms step:5931/6710 train_time:1367408ms step_avg:230.55ms step:5932/6710 train_time:1367648ms step_avg:230.55ms step:5933/6710 train_time:1367889ms step_avg:230.56ms step:5934/6710 train_time:1368136ms step_avg:230.56ms step:5935/6710 train_time:1368376ms step_avg:230.56ms step:5936/6710 train_time:1368615ms step_avg:230.56ms step:5937/6710 train_time:1368854ms step_avg:230.56ms step:5938/6710 train_time:1369098ms step_avg:230.57ms step:5939/6710 train_time:1369341ms step_avg:230.57ms step:5940/6710 train_time:1369581ms step_avg:230.57ms step:5941/6710 train_time:1369826ms step_avg:230.57ms step:5942/6710 train_time:1370070ms step_avg:230.57ms step:5943/6710 train_time:1370314ms step_avg:230.58ms step:5944/6710 train_time:1370554ms step_avg:230.58ms step:5945/6710 train_time:1370796ms step_avg:230.58ms step:5946/6710 train_time:1371038ms step_avg:230.58ms step:5947/6710 train_time:1371281ms step_avg:230.58ms step:5948/6710 train_time:1371519ms step_avg:230.58ms step:5949/6710 train_time:1371764ms step_avg:230.59ms step:5950/6710 train_time:1372003ms step_avg:230.59ms step:5951/6710 train_time:1372245ms step_avg:230.59ms step:5952/6710 train_time:1372484ms step_avg:230.59ms step:5953/6710 train_time:1372728ms step_avg:230.59ms step:5954/6710 train_time:1372970ms step_avg:230.60ms step:5955/6710 train_time:1373211ms step_avg:230.60ms step:5956/6710 train_time:1373451ms step_avg:230.60ms step:5957/6710 train_time:1373696ms step_avg:230.60ms step:5958/6710 train_time:1373934ms step_avg:230.60ms step:5959/6710 train_time:1374175ms step_avg:230.61ms step:5960/6710 train_time:1374418ms step_avg:230.61ms step:5961/6710 train_time:1374663ms step_avg:230.61ms step:5962/6710 train_time:1374908ms step_avg:230.61ms step:5963/6710 train_time:1375149ms step_avg:230.61ms step:5964/6710 train_time:1375389ms step_avg:230.62ms step:5965/6710 train_time:1375632ms step_avg:230.62ms step:5966/6710 train_time:1375874ms step_avg:230.62ms step:5967/6710 
train_time:1376117ms step_avg:230.62ms step:5968/6710 train_time:1376356ms step_avg:230.62ms step:5969/6710 train_time:1376599ms step_avg:230.62ms step:5970/6710 train_time:1376840ms step_avg:230.63ms step:5971/6710 train_time:1377085ms step_avg:230.63ms step:5972/6710 train_time:1377327ms step_avg:230.63ms step:5973/6710 train_time:1377570ms step_avg:230.63ms step:5974/6710 train_time:1377813ms step_avg:230.63ms step:5975/6710 train_time:1378053ms step_avg:230.64ms step:5976/6710 train_time:1378293ms step_avg:230.64ms step:5977/6710 train_time:1378538ms step_avg:230.64ms step:5978/6710 train_time:1378778ms step_avg:230.64ms step:5979/6710 train_time:1379018ms step_avg:230.64ms step:5980/6710 train_time:1379260ms step_avg:230.65ms step:5981/6710 train_time:1379500ms step_avg:230.65ms step:5982/6710 train_time:1379741ms step_avg:230.65ms step:5983/6710 train_time:1379985ms step_avg:230.65ms step:5984/6710 train_time:1380227ms step_avg:230.65ms step:5985/6710 train_time:1380468ms step_avg:230.65ms step:5986/6710 train_time:1380710ms step_avg:230.66ms step:5987/6710 train_time:1380954ms step_avg:230.66ms step:5988/6710 train_time:1381202ms step_avg:230.66ms step:5989/6710 train_time:1381447ms step_avg:230.66ms step:5990/6710 train_time:1381692ms step_avg:230.67ms step:5991/6710 train_time:1381930ms step_avg:230.67ms step:5992/6710 train_time:1382174ms step_avg:230.67ms step:5993/6710 train_time:1382418ms step_avg:230.67ms step:5994/6710 train_time:1382659ms step_avg:230.67ms step:5995/6710 train_time:1382901ms step_avg:230.68ms step:5996/6710 train_time:1383141ms step_avg:230.68ms step:5997/6710 train_time:1383383ms step_avg:230.68ms step:5998/6710 train_time:1383623ms step_avg:230.68ms step:5999/6710 train_time:1383864ms step_avg:230.68ms step:6000/6710 train_time:1384104ms step_avg:230.68ms step:6000/6710 val_loss:2.950933 train_time:1384293ms step_avg:230.72ms Parameter containing: tensor([1.0000, 1.0000, 0.4033, 1.0000, 0.4703, 1.0000, 0.3736, 1.0000], 
device='cuda:0', requires_grad=True) 0 [6.904695510864258, 5.904693603515625] 1 [0.48192164301872253, 5.108675956726074] 2 [0.6043202877044678, 2.849318027496338] 3 [0.6790720820426941, 2.438106060028076] 4 [0.4098162353038788, 1.836240291595459] 5 [0.5904350280761719, 2.3525912761688232] 6 [0.5198438167572021, 1.4954735040664673] 7 [0.674090564250946, 4.228857517242432] 8 [0.49270257353782654, 0.0004430157714523375] 9 [0.4904179275035858, 1.2603594064712524] 10 [0.6153350472450256, 1.7990376949310303] 11 [0.46269491314888, 1.8795480728149414] 12 [0.8521239757537842, 4.978277206420898] 13 [0.9177446961402893, 2.6444156169891357] 14 [0.918066680431366, 0.6881486177444458] 15 [0.8910989761352539, -0.41915518045425415] 0 [12.812752723693848, 19.66461944580078, 26.709739685058594] 1 [22.89697265625, 20.723125457763672, 55.75693893432617] 2 [44.1380615234375, 16.01694107055664, 22.193618774414062] 3 [41.47301483154297, 21.089365005493164, 26.024873733520508] 4 [26.761314392089844, 19.90692138671875, 24.408111572265625] 5 [31.385061264038086, 18.97095489501953, 29.131731033325195] 6 [30.523513793945312, 21.65496253967285, 22.5822811126709] 7 [37.58721923828125, 0.0, 30.37504768371582] 8 [27.70069122314453, 21.450489044189453, 33.368473052978516] 9 [37.408233642578125, 18.903282165527344, 27.905723571777344] 10 [48.49962615966797, 20.145618438720703, 27.56794548034668] 11 [41.544857025146484, 24.74480628967285, 17.72963523864746] 12 [58.098365783691406, 20.722604751586914, 18.254009246826172] 13 [72.23700714111328, 13.9601469039917, 19.9371280670166] 14 [77.8595962524414, 16.243667602539062, 26.142194747924805] 15 [82.9558334350586, 58.077030181884766, 92.39897155761719] step:6001/6710 train_time:1384345ms step_avg:230.69ms step:6002/6710 train_time:1384584ms step_avg:230.69ms step:6003/6710 train_time:1384830ms step_avg:230.69ms step:6004/6710 train_time:1385068ms step_avg:230.69ms step:6005/6710 train_time:1385312ms step_avg:230.69ms step:6006/6710 train_time:1385556ms 
step_avg:230.70ms step:6007/6710 train_time:1385798ms step_avg:230.70ms step:6008/6710 train_time:1386038ms step_avg:230.70ms step:6009/6710 train_time:1386283ms step_avg:230.70ms step:6010/6710 train_time:1386525ms step_avg:230.70ms step:6011/6710 train_time:1386769ms step_avg:230.71ms step:6012/6710 train_time:1387019ms step_avg:230.71ms step:6013/6710 train_time:1387261ms step_avg:230.71ms step:6014/6710 train_time:1387505ms step_avg:230.71ms step:6015/6710 train_time:1387751ms step_avg:230.72ms step:6016/6710 train_time:1387993ms step_avg:230.72ms step:6017/6710 train_time:1388232ms step_avg:230.72ms step:6018/6710 train_time:1388475ms step_avg:230.72ms step:6019/6710 train_time:1388719ms step_avg:230.72ms step:6020/6710 train_time:1388961ms step_avg:230.72ms step:6021/6710 train_time:1389203ms step_avg:230.73ms step:6022/6710 train_time:1389445ms step_avg:230.73ms step:6023/6710 train_time:1389685ms step_avg:230.73ms step:6024/6710 train_time:1389931ms step_avg:230.73ms step:6025/6710 train_time:1390175ms step_avg:230.73ms step:6026/6710 train_time:1390413ms step_avg:230.74ms step:6027/6710 train_time:1390653ms step_avg:230.74ms step:6028/6710 train_time:1390893ms step_avg:230.74ms step:6029/6710 train_time:1391134ms step_avg:230.74ms step:6030/6710 train_time:1391379ms step_avg:230.74ms step:6031/6710 train_time:1391624ms step_avg:230.75ms step:6032/6710 train_time:1391870ms step_avg:230.75ms step:6033/6710 train_time:1392114ms step_avg:230.75ms step:6034/6710 train_time:1392357ms step_avg:230.75ms step:6035/6710 train_time:1392604ms step_avg:230.75ms step:6036/6710 train_time:1392847ms step_avg:230.76ms step:6037/6710 train_time:1393088ms step_avg:230.76ms step:6038/6710 train_time:1393336ms step_avg:230.76ms step:6039/6710 train_time:1393574ms step_avg:230.76ms step:6040/6710 train_time:1393820ms step_avg:230.76ms step:6041/6710 train_time:1394062ms step_avg:230.77ms step:6042/6710 train_time:1394304ms step_avg:230.77ms step:6043/6710 train_time:1394545ms 
step_avg:230.77ms step:6044/6710 train_time:1394788ms step_avg:230.77ms step:6045/6710 train_time:1395033ms step_avg:230.77ms step:6046/6710 train_time:1395272ms step_avg:230.78ms step:6047/6710 train_time:1395514ms step_avg:230.78ms step:6048/6710 train_time:1395756ms step_avg:230.78ms step:6049/6710 train_time:1395995ms step_avg:230.78ms step:6050/6710 train_time:1396245ms step_avg:230.78ms step:6051/6710 train_time:1396488ms step_avg:230.79ms step:6052/6710 train_time:1396726ms step_avg:230.79ms step:6053/6710 train_time:1396970ms step_avg:230.79ms step:6054/6710 train_time:1397212ms step_avg:230.79ms step:6055/6710 train_time:1397458ms step_avg:230.79ms step:6056/6710 train_time:1397695ms step_avg:230.80ms step:6057/6710 train_time:1397943ms step_avg:230.80ms step:6058/6710 train_time:1398185ms step_avg:230.80ms step:6059/6710 train_time:1398431ms step_avg:230.80ms step:6060/6710 train_time:1398671ms step_avg:230.80ms step:6061/6710 train_time:1398912ms step_avg:230.81ms step:6062/6710 train_time:1399151ms step_avg:230.81ms step:6063/6710 train_time:1399395ms step_avg:230.81ms step:6064/6710 train_time:1399635ms step_avg:230.81ms step:6065/6710 train_time:1399879ms step_avg:230.81ms step:6066/6710 train_time:1400126ms step_avg:230.82ms step:6067/6710 train_time:1400367ms step_avg:230.82ms step:6068/6710 train_time:1400611ms step_avg:230.82ms step:6069/6710 train_time:1400853ms step_avg:230.82ms step:6070/6710 train_time:1401098ms step_avg:230.82ms step:6071/6710 train_time:1401337ms step_avg:230.82ms step:6072/6710 train_time:1401580ms step_avg:230.83ms step:6073/6710 train_time:1401820ms step_avg:230.83ms step:6074/6710 train_time:1402062ms step_avg:230.83ms step:6075/6710 train_time:1402307ms step_avg:230.83ms step:6076/6710 train_time:1402548ms step_avg:230.83ms step:6077/6710 train_time:1402789ms step_avg:230.84ms step:6078/6710 train_time:1403028ms step_avg:230.84ms step:6079/6710 train_time:1403270ms step_avg:230.84ms step:6080/6710 train_time:1403515ms 
step_avg:230.84ms step:6081/6710 train_time:1403755ms step_avg:230.84ms step:6082/6710 train_time:1403996ms step_avg:230.84ms step:6083/6710 train_time:1404243ms step_avg:230.85ms step:6084/6710 train_time:1404484ms step_avg:230.85ms step:6085/6710 train_time:1404726ms step_avg:230.85ms step:6086/6710 train_time:1404966ms step_avg:230.85ms step:6087/6710 train_time:1405211ms step_avg:230.85ms step:6088/6710 train_time:1405452ms step_avg:230.86ms step:6089/6710 train_time:1405693ms step_avg:230.86ms step:6090/6710 train_time:1405934ms step_avg:230.86ms step:6091/6710 train_time:1406179ms step_avg:230.86ms step:6092/6710 train_time:1406418ms step_avg:230.86ms step:6093/6710 train_time:1406659ms step_avg:230.86ms step:6094/6710 train_time:1406899ms step_avg:230.87ms step:6095/6710 train_time:1407150ms step_avg:230.87ms step:6096/6710 train_time:1407390ms step_avg:230.87ms step:6097/6710 train_time:1407630ms step_avg:230.87ms step:6098/6710 train_time:1407871ms step_avg:230.87ms step:6099/6710 train_time:1408114ms step_avg:230.88ms step:6100/6710 train_time:1408363ms step_avg:230.88ms step:6101/6710 train_time:1408602ms step_avg:230.88ms step:6102/6710 train_time:1408844ms step_avg:230.88ms step:6103/6710 train_time:1409087ms step_avg:230.88ms step:6104/6710 train_time:1409331ms step_avg:230.89ms step:6105/6710 train_time:1409572ms step_avg:230.89ms step:6106/6710 train_time:1409813ms step_avg:230.89ms step:6107/6710 train_time:1410061ms step_avg:230.89ms step:6108/6710 train_time:1410304ms step_avg:230.89ms step:6109/6710 train_time:1410550ms step_avg:230.90ms step:6110/6710 train_time:1410794ms step_avg:230.90ms step:6111/6710 train_time:1411036ms step_avg:230.90ms step:6112/6710 train_time:1411291ms step_avg:230.90ms step:6113/6710 train_time:1411532ms step_avg:230.91ms step:6114/6710 train_time:1411774ms step_avg:230.91ms step:6115/6710 train_time:1412021ms step_avg:230.91ms step:6116/6710 train_time:1412263ms step_avg:230.91ms step:6117/6710 train_time:1412501ms 
step_avg:230.91ms step:6118/6710 train_time:1412746ms step_avg:230.92ms step:6119/6710 train_time:1412988ms step_avg:230.92ms step:6120/6710 train_time:1413230ms step_avg:230.92ms step:6121/6710 train_time:1413470ms step_avg:230.92ms step:6122/6710 train_time:1413711ms step_avg:230.92ms step:6123/6710 train_time:1413952ms step_avg:230.92ms step:6124/6710 train_time:1414198ms step_avg:230.93ms step:6125/6710 train_time:1414448ms step_avg:230.93ms step:6125/6710 val_loss:2.943879 train_time:1414638ms step_avg:230.96ms Parameter containing: tensor([1.0000, 1.0000, 0.4045, 1.0000, 0.4682, 1.0000, 0.3670, 1.0000], device='cuda:0', requires_grad=True) 0 [6.840086460113525, 5.840084552764893] 1 [0.48165908455848694, 5.015054225921631] 2 [0.6007027626037598, 2.7690231800079346] 3 [0.6746870875358582, 2.3678205013275146] 4 [0.4101617634296417, 1.7766854763031006] 5 [0.5923664569854736, 2.2652413845062256] 6 [0.5165330767631531, 1.4289146661758423] 7 [0.6655552387237549, 4.162845611572266] 8 [0.4941892921924591, -0.04042432829737663] 9 [0.488747239112854, 1.2189005613327026] 10 [0.6152791380882263, 1.7515535354614258] 11 [0.462969571352005, 1.8133925199508667] 12 [0.8545764088630676, 4.894193649291992] 13 [0.9153841137886047, 2.5971426963806152] 14 [0.9154993295669556, 0.659492015838623] 15 [0.8897273540496826, -0.4506281912326813] 0 [12.684314727783203, 19.29776382446289, 26.695770263671875] 1 [22.64055061340332, 20.23110580444336, 55.36742401123047] 2 [43.45186233520508, 15.551725387573242, 21.76962661743164] 3 [40.410308837890625, 20.64081573486328, 25.625030517578125] 4 [26.146045684814453, 19.478683471679688, 24.224456787109375] 5 [30.886995315551758, 18.595449447631836, 28.7592830657959] 6 [29.854291915893555, 21.23850440979004, 22.47332000732422] 7 [36.49687957763672, 0.0, 30.11082649230957] 8 [27.200868606567383, 21.08005714416504, 32.94463348388672] 9 [36.50294494628906, 18.48750877380371, 27.475475311279297] 10 [47.385162353515625, 19.768383026123047, 
27.214351654052734] 11 [40.729549407958984, 24.26506996154785, 17.557628631591797] 12 [57.151302337646484, 20.36566162109375, 18.180070877075195] 13 [70.90326690673828, 13.75167179107666, 19.726917266845703] 14 [76.28632354736328, 15.895337104797363, 25.72590446472168] 15 [81.19574737548828, 56.966957092285156, 90.20414733886719] step:6126/6710 train_time:1414693ms step_avg:230.93ms step:6127/6710 train_time:1414938ms step_avg:230.93ms step:6128/6710 train_time:1415183ms step_avg:230.94ms step:6129/6710 train_time:1415425ms step_avg:230.94ms step:6130/6710 train_time:1415671ms step_avg:230.94ms step:6131/6710 train_time:1415916ms step_avg:230.94ms step:6132/6710 train_time:1416164ms step_avg:230.95ms step:6133/6710 train_time:1416406ms step_avg:230.95ms step:6134/6710 train_time:1416647ms step_avg:230.95ms step:6135/6710 train_time:1416891ms step_avg:230.95ms step:6136/6710 train_time:1417133ms step_avg:230.95ms step:6137/6710 train_time:1417374ms step_avg:230.96ms step:6138/6710 train_time:1417616ms step_avg:230.96ms step:6139/6710 train_time:1417856ms step_avg:230.96ms step:6140/6710 train_time:1418098ms step_avg:230.96ms step:6141/6710 train_time:1418340ms step_avg:230.96ms step:6142/6710 train_time:1418581ms step_avg:230.96ms step:6143/6710 train_time:1418824ms step_avg:230.97ms step:6144/6710 train_time:1419067ms step_avg:230.97ms step:6145/6710 train_time:1419314ms step_avg:230.97ms step:6146/6710 train_time:1419566ms step_avg:230.97ms step:6147/6710 train_time:1419808ms step_avg:230.98ms step:6148/6710 train_time:1420046ms step_avg:230.98ms step:6149/6710 train_time:1420286ms step_avg:230.98ms step:6150/6710 train_time:1420528ms step_avg:230.98ms step:6151/6710 train_time:1420771ms step_avg:230.98ms step:6152/6710 train_time:1421012ms step_avg:230.98ms step:6153/6710 train_time:1421252ms step_avg:230.99ms step:6154/6710 train_time:1421495ms step_avg:230.99ms step:6155/6710 train_time:1421736ms step_avg:230.99ms step:6156/6710 train_time:1421977ms 
step_avg:230.99ms step:6157/6710 train_time:1422219ms step_avg:230.99ms step:6158/6710 train_time:1422463ms step_avg:230.99ms step:6159/6710 train_time:1422701ms step_avg:231.00ms step:6160/6710 train_time:1422941ms step_avg:231.00ms step:6161/6710 train_time:1423181ms step_avg:231.00ms step:6162/6710 train_time:1423426ms step_avg:231.00ms step:6163/6710 train_time:1423667ms step_avg:231.00ms step:6164/6710 train_time:1423909ms step_avg:231.00ms step:6165/6710 train_time:1424152ms step_avg:231.01ms step:6166/6710 train_time:1424391ms step_avg:231.01ms step:6167/6710 train_time:1424631ms step_avg:231.01ms step:6168/6710 train_time:1424874ms step_avg:231.01ms step:6169/6710 train_time:1425120ms step_avg:231.01ms step:6170/6710 train_time:1425361ms step_avg:231.01ms step:6171/6710 train_time:1425600ms step_avg:231.02ms step:6172/6710 train_time:1425838ms step_avg:231.02ms step:6173/6710 train_time:1426078ms step_avg:231.02ms step:6174/6710 train_time:1426317ms step_avg:231.02ms step:6175/6710 train_time:1426557ms step_avg:231.02ms step:6176/6710 train_time:1426800ms step_avg:231.02ms step:6177/6710 train_time:1427041ms step_avg:231.02ms step:6178/6710 train_time:1427281ms step_avg:231.03ms step:6179/6710 train_time:1427522ms step_avg:231.03ms step:6180/6710 train_time:1427763ms step_avg:231.03ms step:6181/6710 train_time:1428002ms step_avg:231.03ms step:6182/6710 train_time:1428242ms step_avg:231.03ms step:6183/6710 train_time:1428486ms step_avg:231.03ms step:6184/6710 train_time:1428727ms step_avg:231.04ms step:6185/6710 train_time:1428968ms step_avg:231.04ms step:6186/6710 train_time:1429212ms step_avg:231.04ms step:6187/6710 train_time:1429453ms step_avg:231.04ms step:6188/6710 train_time:1429701ms step_avg:231.04ms step:6189/6710 train_time:1429942ms step_avg:231.05ms step:6190/6710 train_time:1430186ms step_avg:231.05ms step:6191/6710 train_time:1430425ms step_avg:231.05ms step:6192/6710 train_time:1430665ms step_avg:231.05ms step:6193/6710 train_time:1430908ms 
step_avg:231.05ms step:6194/6710 train_time:1431149ms step_avg:231.05ms step:6195/6710 train_time:1431389ms step_avg:231.06ms step:6196/6710 train_time:1431634ms step_avg:231.06ms step:6197/6710 train_time:1431874ms step_avg:231.06ms step:6198/6710 train_time:1432118ms step_avg:231.06ms step:6199/6710 train_time:1432362ms step_avg:231.06ms step:6200/6710 train_time:1432604ms step_avg:231.07ms step:6201/6710 train_time:1432841ms step_avg:231.07ms step:6202/6710 train_time:1433089ms step_avg:231.07ms step:6203/6710 train_time:1433329ms step_avg:231.07ms step:6204/6710 train_time:1433568ms step_avg:231.07ms step:6205/6710 train_time:1433808ms step_avg:231.07ms step:6206/6710 train_time:1434048ms step_avg:231.07ms step:6207/6710 train_time:1434289ms step_avg:231.08ms step:6208/6710 train_time:1434528ms step_avg:231.08ms step:6209/6710 train_time:1434768ms step_avg:231.08ms step:6210/6710 train_time:1435013ms step_avg:231.08ms step:6211/6710 train_time:1435256ms step_avg:231.08ms step:6212/6710 train_time:1435496ms step_avg:231.08ms step:6213/6710 train_time:1435738ms step_avg:231.09ms step:6214/6710 train_time:1435979ms step_avg:231.09ms step:6215/6710 train_time:1436221ms step_avg:231.09ms step:6216/6710 train_time:1436466ms step_avg:231.09ms step:6217/6710 train_time:1436707ms step_avg:231.09ms step:6218/6710 train_time:1436949ms step_avg:231.10ms step:6219/6710 train_time:1437190ms step_avg:231.10ms step:6220/6710 train_time:1437433ms step_avg:231.10ms step:6221/6710 train_time:1437677ms step_avg:231.10ms step:6222/6710 train_time:1437920ms step_avg:231.10ms step:6223/6710 train_time:1438162ms step_avg:231.10ms step:6224/6710 train_time:1438403ms step_avg:231.11ms step:6225/6710 train_time:1438645ms step_avg:231.11ms step:6226/6710 train_time:1438887ms step_avg:231.11ms step:6227/6710 train_time:1439129ms step_avg:231.11ms step:6228/6710 train_time:1439370ms step_avg:231.11ms step:6229/6710 train_time:1439611ms step_avg:231.11ms step:6230/6710 train_time:1439853ms 
step_avg:231.12ms step:6231/6710 train_time:1440095ms step_avg:231.12ms step:6232/6710 train_time:1440339ms step_avg:231.12ms step:6233/6710 train_time:1440581ms step_avg:231.12ms step:6234/6710 train_time:1440823ms step_avg:231.12ms step:6235/6710 train_time:1441066ms step_avg:231.13ms step:6236/6710 train_time:1441306ms step_avg:231.13ms step:6237/6710 train_time:1441546ms step_avg:231.13ms step:6238/6710 train_time:1441791ms step_avg:231.13ms step:6239/6710 train_time:1442034ms step_avg:231.13ms step:6240/6710 train_time:1442278ms step_avg:231.13ms step:6241/6710 train_time:1442518ms step_avg:231.14ms step:6242/6710 train_time:1442759ms step_avg:231.14ms step:6243/6710 train_time:1443003ms step_avg:231.14ms step:6244/6710 train_time:1443248ms step_avg:231.14ms step:6245/6710 train_time:1443488ms step_avg:231.14ms step:6246/6710 train_time:1443737ms step_avg:231.15ms step:6247/6710 train_time:1443977ms step_avg:231.15ms step:6248/6710 train_time:1444220ms step_avg:231.15ms step:6249/6710 train_time:1444462ms step_avg:231.15ms step:6250/6710 train_time:1444704ms step_avg:231.15ms step:6250/6710 val_loss:2.937172 train_time:1444896ms step_avg:231.18ms Parameter containing: tensor([1.0000, 1.0000, 0.4016, 1.0000, 0.4650, 1.0000, 0.3635, 1.0000], device='cuda:0', requires_grad=True) 0 [6.798734188079834, 5.798732280731201] 1 [0.47959405183792114, 4.9422688484191895] 2 [0.5926387310028076, 2.697317600250244] 3 [0.6748784780502319, 2.302654981613159] 4 [0.41026344895362854, 1.7370665073394775] 5 [0.5899282097816467, 2.2129428386688232] 6 [0.5207152962684631, 1.384256362915039] 7 [0.6628214716911316, 4.107271671295166] 8 [0.497097909450531, -0.08004341274499893] 9 [0.4890844225883484, 1.1769362688064575] 10 [0.6142629981040955, 1.7018383741378784] 11 [0.4626520872116089, 1.7670619487762451] 12 [0.8489891290664673, 4.83775520324707] 13 [0.9103706479072571, 2.561436414718628] 14 [0.9141433835029602, 0.6351068019866943] 15 [0.8920366168022156, -0.47087833285331726] 0 
[12.599835395812988, 19.040884017944336, 26.18096351623535] 1 [22.226789474487305, 19.96710777282715, 54.235435485839844] 2 [42.023826599121094, 15.327770233154297, 21.563589096069336] 3 [39.41648483276367, 20.310789108276367, 25.436386108398438] 4 [25.68097496032715, 19.179868698120117, 23.905319213867188] 5 [30.279531478881836, 18.268512725830078, 28.30985450744629] 6 [29.533906936645508, 20.892276763916016, 22.177982330322266] 7 [35.85233688354492, 0.0, 29.502853393554688] 8 [26.831995010375977, 20.772905349731445, 32.47675323486328] 9 [35.934425354003906, 18.208240509033203, 27.057579040527344] 10 [46.50463104248047, 19.501855850219727, 26.71908187866211] 11 [39.8800048828125, 23.86643409729004, 17.350130081176758] 12 [55.76012420654297, 20.08049964904785, 17.951101303100586] 13 [69.02957916259766, 13.460749626159668, 19.436176300048828] 14 [74.31920623779297, 15.548028945922852, 25.359132766723633] 15 [79.4703140258789, 55.925567626953125, 87.75983428955078] step:6251/6710 train_time:1444948ms step_avg:231.15ms step:6252/6710 train_time:1445185ms step_avg:231.16ms step:6253/6710 train_time:1445442ms step_avg:231.16ms step:6254/6710 train_time:1445682ms step_avg:231.16ms step:6255/6710 train_time:1445923ms step_avg:231.16ms step:6256/6710 train_time:1446164ms step_avg:231.16ms step:6257/6710 train_time:1446408ms step_avg:231.17ms step:6258/6710 train_time:1446649ms step_avg:231.17ms step:6259/6710 train_time:1446895ms step_avg:231.17ms step:6260/6710 train_time:1447132ms step_avg:231.17ms step:6261/6710 train_time:1447382ms step_avg:231.17ms step:6262/6710 train_time:1447623ms step_avg:231.18ms step:6263/6710 train_time:1447865ms step_avg:231.18ms step:6264/6710 train_time:1448104ms step_avg:231.18ms step:6265/6710 train_time:1448346ms step_avg:231.18ms step:6266/6710 train_time:1448589ms step_avg:231.18ms step:6267/6710 train_time:1448831ms step_avg:231.18ms step:6268/6710 train_time:1449076ms step_avg:231.19ms step:6269/6710 train_time:1449317ms 
step_avg:231.19ms step:6270/6710 train_time:1449561ms step_avg:231.19ms step:6271/6710 train_time:1449803ms step_avg:231.19ms step:6272/6710 train_time:1450048ms step_avg:231.19ms step:6273/6710 train_time:1450289ms step_avg:231.20ms step:6274/6710 train_time:1450530ms step_avg:231.20ms step:6275/6710 train_time:1450769ms step_avg:231.20ms step:6276/6710 train_time:1451010ms step_avg:231.20ms step:6277/6710 train_time:1451253ms step_avg:231.20ms step:6278/6710 train_time:1451496ms step_avg:231.20ms step:6279/6710 train_time:1451739ms step_avg:231.21ms step:6280/6710 train_time:1451982ms step_avg:231.21ms step:6281/6710 train_time:1452220ms step_avg:231.21ms step:6282/6710 train_time:1452464ms step_avg:231.21ms step:6283/6710 train_time:1452705ms step_avg:231.21ms step:6284/6710 train_time:1452947ms step_avg:231.21ms step:6285/6710 train_time:1453185ms step_avg:231.21ms step:6286/6710 train_time:1453427ms step_avg:231.22ms step:6287/6710 train_time:1453670ms step_avg:231.22ms step:6288/6710 train_time:1453916ms step_avg:231.22ms step:6289/6710 train_time:1454156ms step_avg:231.22ms step:6290/6710 train_time:1454397ms step_avg:231.22ms step:6291/6710 train_time:1454639ms step_avg:231.23ms step:6292/6710 train_time:1454882ms step_avg:231.23ms step:6293/6710 train_time:1455125ms step_avg:231.23ms step:6294/6710 train_time:1455374ms step_avg:231.23ms step:6295/6710 train_time:1455615ms step_avg:231.23ms step:6296/6710 train_time:1455858ms step_avg:231.24ms step:6297/6710 train_time:1456097ms step_avg:231.24ms step:6298/6710 train_time:1456338ms step_avg:231.24ms step:6299/6710 train_time:1456577ms step_avg:231.24ms step:6300/6710 train_time:1456826ms step_avg:231.24ms step:6301/6710 train_time:1457067ms step_avg:231.24ms step:6302/6710 train_time:1457310ms step_avg:231.25ms step:6303/6710 train_time:1457548ms step_avg:231.25ms step:6304/6710 train_time:1457790ms step_avg:231.25ms step:6305/6710 train_time:1458032ms step_avg:231.25ms step:6306/6710 train_time:1458271ms 
step_avg:231.25ms step:6307/6710 train_time:1458517ms step_avg:231.25ms step:6308/6710 train_time:1458759ms step_avg:231.26ms step:6309/6710 train_time:1459000ms step_avg:231.26ms step:6310/6710 train_time:1459242ms step_avg:231.26ms step:6311/6710 train_time:1459485ms step_avg:231.26ms step:6312/6710 train_time:1459727ms step_avg:231.26ms step:6313/6710 train_time:1459969ms step_avg:231.26ms step:6314/6710 train_time:1460213ms step_avg:231.27ms step:6315/6710 train_time:1460454ms step_avg:231.27ms step:6316/6710 train_time:1460694ms step_avg:231.27ms step:6317/6710 train_time:1460937ms step_avg:231.27ms step:6318/6710 train_time:1461177ms step_avg:231.27ms step:6319/6710 train_time:1461418ms step_avg:231.27ms step:6320/6710 train_time:1461663ms step_avg:231.28ms step:6321/6710 train_time:1461908ms step_avg:231.28ms step:6322/6710 train_time:1462152ms step_avg:231.28ms step:6323/6710 train_time:1462394ms step_avg:231.28ms step:6324/6710 train_time:1462634ms step_avg:231.28ms step:6325/6710 train_time:1462877ms step_avg:231.28ms step:6326/6710 train_time:1463119ms step_avg:231.29ms step:6327/6710 train_time:1463365ms step_avg:231.29ms step:6328/6710 train_time:1463602ms step_avg:231.29ms step:6329/6710 train_time:1463845ms step_avg:231.29ms step:6330/6710 train_time:1464094ms step_avg:231.29ms step:6331/6710 train_time:1464334ms step_avg:231.30ms step:6332/6710 train_time:1464573ms step_avg:231.30ms step:6333/6710 train_time:1464814ms step_avg:231.30ms step:6334/6710 train_time:1465057ms step_avg:231.30ms step:6335/6710 train_time:1465300ms step_avg:231.30ms step:6336/6710 train_time:1465545ms step_avg:231.30ms step:6337/6710 train_time:1465787ms step_avg:231.31ms step:6338/6710 train_time:1466029ms step_avg:231.31ms step:6339/6710 train_time:1466272ms step_avg:231.31ms step:6340/6710 train_time:1466516ms step_avg:231.31ms step:6341/6710 train_time:1466755ms step_avg:231.31ms step:6342/6710 train_time:1467001ms step_avg:231.32ms step:6343/6710 train_time:1467245ms 
step_avg:231.32ms step:6344/6710 train_time:1467490ms step_avg:231.32ms step:6345/6710 train_time:1467732ms step_avg:231.32ms step:6346/6710 train_time:1467979ms step_avg:231.32ms step:6347/6710 train_time:1468218ms step_avg:231.32ms step:6348/6710 train_time:1468459ms step_avg:231.33ms step:6349/6710 train_time:1468699ms step_avg:231.33ms step:6350/6710 train_time:1468944ms step_avg:231.33ms step:6351/6710 train_time:1469186ms step_avg:231.33ms step:6352/6710 train_time:1469429ms step_avg:231.33ms step:6353/6710 train_time:1469668ms step_avg:231.33ms step:6354/6710 train_time:1469910ms step_avg:231.34ms step:6355/6710 train_time:1470153ms step_avg:231.34ms step:6356/6710 train_time:1470392ms step_avg:231.34ms step:6357/6710 train_time:1470635ms step_avg:231.34ms step:6358/6710 train_time:1470877ms step_avg:231.34ms step:6359/6710 train_time:1471119ms step_avg:231.34ms step:6360/6710 train_time:1471361ms step_avg:231.35ms step:6361/6710 train_time:1471601ms step_avg:231.35ms step:6362/6710 train_time:1471843ms step_avg:231.35ms step:6363/6710 train_time:1472083ms step_avg:231.35ms step:6364/6710 train_time:1472325ms step_avg:231.35ms step:6365/6710 train_time:1472569ms step_avg:231.35ms step:6366/6710 train_time:1472819ms step_avg:231.36ms step:6367/6710 train_time:1473061ms step_avg:231.36ms step:6368/6710 train_time:1473300ms step_avg:231.36ms step:6369/6710 train_time:1473540ms step_avg:231.36ms step:6370/6710 train_time:1473782ms step_avg:231.36ms step:6371/6710 train_time:1474023ms step_avg:231.36ms step:6372/6710 train_time:1474263ms step_avg:231.37ms step:6373/6710 train_time:1474504ms step_avg:231.37ms step:6374/6710 train_time:1474750ms step_avg:231.37ms step:6375/6710 train_time:1474995ms step_avg:231.37ms step:6375/6710 val_loss:2.930899 train_time:1475183ms step_avg:231.40ms Parameter containing: tensor([1.0000, 1.0000, 0.4026, 1.0000, 0.4616, 1.0000, 0.3586, 1.0000], device='cuda:0', requires_grad=True) 0 [6.762256622314453, 5.76225471496582] 1 
[0.4795667231082916, 4.888319969177246] 2 [0.5853868722915649, 2.641792058944702] 3 [0.6748853921890259, 2.25907564163208] 4 [0.4102613031864166, 1.6989341974258423] 5 [0.5876464247703552, 2.1616268157958984] 6 [0.5188279747962952, 1.3481730222702026] 7 [0.6602962613105774, 4.0652055740356445] 8 [0.49273431301116943, -0.11542300879955292] 9 [0.4859302043914795, 1.1463793516159058] 10 [0.6118549108505249, 1.6701213121414185] 11 [0.4601714611053467, 1.7315430641174316] 12 [0.8519997000694275, 4.791487216949463] 13 [0.9108787775039673, 2.533935546875] 14 [0.9133723378181458, 0.6064876914024353] 15 [0.8913506865501404, -0.5011759996414185] 0 [12.526606559753418, 18.806228637695312, 26.0306396484375] 1 [22.033090591430664, 19.70437240600586, 53.85078048706055] 2 [41.16535949707031, 15.02949047088623, 21.35946273803711] 3 [38.70133590698242, 20.0129337310791, 25.30139923095703] 4 [25.31201934814453, 18.995723724365234, 23.829282760620117] 5 [29.86977195739746, 18.05109214782715, 28.045284271240234] 6 [29.068050384521484, 20.6637020111084, 21.941242218017578] 7 [35.23378372192383, 0.0, 29.124649047851562] 8 [26.1799373626709, 20.50486183166504, 32.230918884277344] 9 [35.070579528808594, 17.927860260009766, 26.8497314453125] 10 [45.48289108276367, 19.258861541748047, 26.504425048828125] 11 [38.99958419799805, 23.60753059387207, 17.161941528320312] 12 [54.978126525878906, 19.914196014404297, 17.78824806213379] 13 [68.19657897949219, 13.267997741699219, 19.20834732055664] 14 [73.36561584472656, 15.264827728271484, 24.989744186401367] 15 [78.38163757324219, 55.244773864746094, 86.13951873779297] step:6376/6710 train_time:1475235ms step_avg:231.37ms step:6377/6710 train_time:1475472ms step_avg:231.37ms step:6378/6710 train_time:1475719ms step_avg:231.38ms step:6379/6710 train_time:1475959ms step_avg:231.38ms step:6380/6710 train_time:1476200ms step_avg:231.38ms step:6381/6710 train_time:1476442ms step_avg:231.38ms step:6382/6710 train_time:1476684ms step_avg:231.38ms 
step:6383/6710 train_time:1476923ms step_avg:231.38ms step:6384/6710 train_time:1477171ms step_avg:231.39ms step:6385/6710 train_time:1477415ms step_avg:231.39ms step:6386/6710 train_time:1477655ms step_avg:231.39ms step:6387/6710 train_time:1477896ms step_avg:231.39ms step:6388/6710 train_time:1478136ms step_avg:231.39ms step:6389/6710 train_time:1478378ms step_avg:231.39ms step:6390/6710 train_time:1478618ms step_avg:231.40ms step:6391/6710 train_time:1478859ms step_avg:231.40ms step:6392/6710 train_time:1479099ms step_avg:231.40ms step:6393/6710 train_time:1479338ms step_avg:231.40ms step:6394/6710 train_time:1479589ms step_avg:231.40ms step:6395/6710 train_time:1479830ms step_avg:231.40ms step:6396/6710 train_time:1480075ms step_avg:231.41ms step:6397/6710 train_time:1480314ms step_avg:231.41ms step:6398/6710 train_time:1480556ms step_avg:231.41ms step:6399/6710 train_time:1480799ms step_avg:231.41ms step:6400/6710 train_time:1481044ms step_avg:231.41ms step:6401/6710 train_time:1481283ms step_avg:231.41ms step:6402/6710 train_time:1481525ms step_avg:231.42ms step:6403/6710 train_time:1481766ms step_avg:231.42ms step:6404/6710 train_time:1482010ms step_avg:231.42ms step:6405/6710 train_time:1482250ms step_avg:231.42ms step:6406/6710 train_time:1482495ms step_avg:231.42ms step:6407/6710 train_time:1482733ms step_avg:231.42ms step:6408/6710 train_time:1482978ms step_avg:231.43ms step:6409/6710 train_time:1483218ms step_avg:231.43ms step:6410/6710 train_time:1483460ms step_avg:231.43ms step:6411/6710 train_time:1483698ms step_avg:231.43ms step:6412/6710 train_time:1483943ms step_avg:231.43ms step:6413/6710 train_time:1484189ms step_avg:231.43ms step:6414/6710 train_time:1484432ms step_avg:231.44ms step:6415/6710 train_time:1484669ms step_avg:231.44ms step:6416/6710 train_time:1484912ms step_avg:231.44ms step:6417/6710 train_time:1485154ms step_avg:231.44ms step:6418/6710 train_time:1485396ms step_avg:231.44ms step:6419/6710 train_time:1485640ms step_avg:231.44ms 
step:6420/6710 train_time:1485878ms step_avg:231.45ms step:6421/6710 train_time:1486127ms step_avg:231.45ms step:6422/6710 train_time:1486369ms step_avg:231.45ms step:6423/6710 train_time:1486613ms step_avg:231.45ms step:6424/6710 train_time:1486855ms step_avg:231.45ms step:6425/6710 train_time:1487097ms step_avg:231.45ms step:6426/6710 train_time:1487339ms step_avg:231.46ms step:6427/6710 train_time:1487579ms step_avg:231.46ms step:6428/6710 train_time:1487820ms step_avg:231.46ms step:6429/6710 train_time:1488063ms step_avg:231.46ms step:6430/6710 train_time:1488308ms step_avg:231.46ms step:6431/6710 train_time:1488550ms step_avg:231.46ms step:6432/6710 train_time:1488790ms step_avg:231.47ms step:6433/6710 train_time:1489032ms step_avg:231.47ms step:6434/6710 train_time:1489273ms step_avg:231.47ms step:6435/6710 train_time:1489516ms step_avg:231.47ms step:6436/6710 train_time:1489757ms step_avg:231.47ms step:6437/6710 train_time:1489998ms step_avg:231.47ms step:6438/6710 train_time:1490240ms step_avg:231.48ms step:6439/6710 train_time:1490482ms step_avg:231.48ms step:6440/6710 train_time:1490725ms step_avg:231.48ms step:6441/6710 train_time:1490969ms step_avg:231.48ms step:6442/6710 train_time:1491210ms step_avg:231.48ms step:6443/6710 train_time:1491455ms step_avg:231.48ms step:6444/6710 train_time:1491697ms step_avg:231.49ms step:6445/6710 train_time:1491938ms step_avg:231.49ms step:6446/6710 train_time:1492181ms step_avg:231.49ms step:6447/6710 train_time:1492424ms step_avg:231.49ms step:6448/6710 train_time:1492665ms step_avg:231.49ms step:6449/6710 train_time:1492908ms step_avg:231.49ms step:6450/6710 train_time:1493146ms step_avg:231.50ms step:6451/6710 train_time:1493389ms step_avg:231.50ms step:6452/6710 train_time:1493632ms step_avg:231.50ms step:6453/6710 train_time:1493875ms step_avg:231.50ms step:6454/6710 train_time:1494115ms step_avg:231.50ms step:6455/6710 train_time:1494356ms step_avg:231.50ms step:6456/6710 train_time:1494605ms step_avg:231.51ms 
step:6457/6710 train_time:1494846ms step_avg:231.51ms step:6458/6710 train_time:1495094ms step_avg:231.51ms step:6459/6710 train_time:1495333ms step_avg:231.51ms step:6460/6710 train_time:1495576ms step_avg:231.51ms step:6461/6710 train_time:1495817ms step_avg:231.51ms step:6462/6710 train_time:1496060ms step_avg:231.52ms step:6463/6710 train_time:1496301ms step_avg:231.52ms step:6464/6710 train_time:1496548ms step_avg:231.52ms step:6465/6710 train_time:1496791ms step_avg:231.52ms step:6466/6710 train_time:1497038ms step_avg:231.52ms step:6467/6710 train_time:1497283ms step_avg:231.53ms step:6468/6710 train_time:1497524ms step_avg:231.53ms step:6469/6710 train_time:1497767ms step_avg:231.53ms step:6470/6710 train_time:1498019ms step_avg:231.53ms step:6471/6710 train_time:1498263ms step_avg:231.53ms step:6472/6710 train_time:1498505ms step_avg:231.54ms step:6473/6710 train_time:1498748ms step_avg:231.54ms step:6474/6710 train_time:1498992ms step_avg:231.54ms step:6475/6710 train_time:1499236ms step_avg:231.54ms step:6476/6710 train_time:1499483ms step_avg:231.54ms step:6477/6710 train_time:1499733ms step_avg:231.55ms step:6478/6710 train_time:1499976ms step_avg:231.55ms step:6479/6710 train_time:1500221ms step_avg:231.55ms step:6480/6710 train_time:1500463ms step_avg:231.55ms step:6481/6710 train_time:1500706ms step_avg:231.55ms step:6482/6710 train_time:1500950ms step_avg:231.56ms step:6483/6710 train_time:1501193ms step_avg:231.56ms step:6484/6710 train_time:1501441ms step_avg:231.56ms step:6485/6710 train_time:1501682ms step_avg:231.56ms step:6486/6710 train_time:1501927ms step_avg:231.56ms step:6487/6710 train_time:1502173ms step_avg:231.57ms step:6488/6710 train_time:1502418ms step_avg:231.57ms step:6489/6710 train_time:1502661ms step_avg:231.57ms step:6490/6710 train_time:1502905ms step_avg:231.57ms step:6491/6710 train_time:1503147ms step_avg:231.57ms step:6492/6710 train_time:1503394ms step_avg:231.58ms step:6493/6710 train_time:1503635ms step_avg:231.58ms 
step:6494/6710 train_time:1503882ms step_avg:231.58ms step:6495/6710 train_time:1504123ms step_avg:231.58ms step:6496/6710 train_time:1504368ms step_avg:231.58ms step:6497/6710 train_time:1504613ms step_avg:231.59ms step:6498/6710 train_time:1504861ms step_avg:231.59ms step:6499/6710 train_time:1505111ms step_avg:231.59ms step:6500/6710 train_time:1505355ms step_avg:231.59ms step:6500/6710 val_loss:2.924802 train_time:1505547ms step_avg:231.62ms Parameter containing: tensor([1.0000, 1.0000, 0.4023, 1.0000, 0.4595, 1.0000, 0.3557, 1.0000], device='cuda:0', requires_grad=True) 0 [6.727221965789795, 5.727220058441162] 1 [0.47845402359962463, 4.835204124450684] 2 [0.5829335451126099, 2.588350772857666] 3 [0.6764237284660339, 2.2232024669647217] 4 [0.4122019410133362, 1.6668802499771118] 5 [0.5868810415267944, 2.122805118560791] 6 [0.5195006132125854, 1.3047428131103516] 7 [0.6617592573165894, 4.016378402709961] 8 [0.49508392810821533, -0.15552102029323578] 9 [0.48629847168922424, 1.1203070878982544] 10 [0.6122664213180542, 1.6404474973678589] 11 [0.46183985471725464, 1.6996454000473022] 12 [0.8474966287612915, 4.7484822273254395] 13 [0.9075577259063721, 2.5020852088928223] 14 [0.9114769697189331, 0.580877423286438] 15 [0.8938398361206055, -0.526146411895752] 0 [12.456518173217773, 18.622703552246094, 25.885419845581055] 1 [21.82389259338379, 19.492403030395508, 53.98290252685547] 2 [40.90663146972656, 14.82417106628418, 21.032373428344727] 3 [38.3958854675293, 19.784915924072266, 24.884305953979492] 4 [25.134828567504883, 18.774267196655273, 23.58211898803711] 5 [29.534414291381836, 17.814233779907227, 27.890796661376953] 6 [28.825668334960938, 20.416086196899414, 21.892667770385742] 7 [35.01020431518555, 0.0, 28.890012741088867] 8 [26.09318733215332, 20.244564056396484, 31.78197479248047] 9 [34.69511413574219, 17.697052001953125, 26.577260971069336] 10 [44.98711013793945, 19.030885696411133, 26.297956466674805] 11 [38.72028732299805, 23.392242431640625, 
17.062551498413086] 12 [54.28318786621094, 19.734325408935547, 17.714881896972656] 13 [67.20268249511719, 13.076300621032715, 19.104856491088867] 14 [72.23493957519531, 15.093877792358398, 24.85576629638672] 15 [77.51596069335938, 54.60897445678711, 85.33008575439453] step:6501/6710 train_time:1505599ms step_avg:231.60ms step:6502/6710 train_time:1505844ms step_avg:231.60ms step:6503/6710 train_time:1506087ms step_avg:231.60ms step:6504/6710 train_time:1506337ms step_avg:231.60ms step:6505/6710 train_time:1506580ms step_avg:231.60ms step:6506/6710 train_time:1506828ms step_avg:231.61ms step:6507/6710 train_time:1507070ms step_avg:231.61ms step:6508/6710 train_time:1507314ms step_avg:231.61ms step:6509/6710 train_time:1507563ms step_avg:231.61ms step:6510/6710 train_time:1507805ms step_avg:231.61ms step:6511/6710 train_time:1508048ms step_avg:231.62ms step:6512/6710 train_time:1508293ms step_avg:231.62ms step:6513/6710 train_time:1508538ms step_avg:231.62ms step:6514/6710 train_time:1508778ms step_avg:231.62ms step:6515/6710 train_time:1509035ms step_avg:231.62ms step:6516/6710 train_time:1509277ms step_avg:231.63ms step:6517/6710 train_time:1509525ms step_avg:231.63ms step:6518/6710 train_time:1509767ms step_avg:231.63ms step:6519/6710 train_time:1510013ms step_avg:231.63ms step:6520/6710 train_time:1510259ms step_avg:231.63ms step:6521/6710 train_time:1510503ms step_avg:231.64ms step:6522/6710 train_time:1510745ms step_avg:231.64ms step:6523/6710 train_time:1510989ms step_avg:231.64ms step:6524/6710 train_time:1511232ms step_avg:231.64ms step:6525/6710 train_time:1511477ms step_avg:231.64ms step:6526/6710 train_time:1511719ms step_avg:231.65ms step:6527/6710 train_time:1511964ms step_avg:231.65ms step:6528/6710 train_time:1512205ms step_avg:231.65ms step:6529/6710 train_time:1512452ms step_avg:231.65ms step:6530/6710 train_time:1512699ms step_avg:231.65ms step:6531/6710 train_time:1512944ms step_avg:231.66ms step:6532/6710 train_time:1513188ms step_avg:231.66ms 
step:6533/6710 train_time:1513433ms step_avg:231.66ms step:6534/6710 train_time:1513679ms step_avg:231.66ms step:6535/6710 train_time:1513930ms step_avg:231.66ms step:6536/6710 train_time:1514178ms step_avg:231.67ms step:6537/6710 train_time:1514421ms step_avg:231.67ms step:6538/6710 train_time:1514666ms step_avg:231.67ms step:6539/6710 train_time:1514913ms step_avg:231.67ms step:6540/6710 train_time:1515158ms step_avg:231.68ms step:6541/6710 train_time:1515406ms step_avg:231.68ms step:6542/6710 train_time:1515657ms step_avg:231.68ms step:6543/6710 train_time:1515907ms step_avg:231.68ms step:6544/6710 train_time:1516156ms step_avg:231.69ms step:6545/6710 train_time:1516396ms step_avg:231.69ms step:6546/6710 train_time:1516642ms step_avg:231.69ms step:6547/6710 train_time:1516883ms step_avg:231.69ms step:6548/6710 train_time:1517126ms step_avg:231.69ms step:6549/6710 train_time:1517371ms step_avg:231.70ms step:6550/6710 train_time:1517614ms step_avg:231.70ms step:6551/6710 train_time:1517861ms step_avg:231.70ms step:6552/6710 train_time:1518106ms step_avg:231.70ms step:6553/6710 train_time:1518349ms step_avg:231.70ms step:6554/6710 train_time:1518591ms step_avg:231.70ms step:6555/6710 train_time:1518834ms step_avg:231.71ms step:6556/6710 train_time:1519082ms step_avg:231.71ms step:6557/6710 train_time:1519325ms step_avg:231.71ms step:6558/6710 train_time:1519567ms step_avg:231.71ms step:6559/6710 train_time:1519810ms step_avg:231.71ms step:6560/6710 train_time:1520057ms step_avg:231.72ms step:6561/6710 train_time:1520304ms step_avg:231.72ms step:6562/6710 train_time:1520552ms step_avg:231.72ms step:6563/6710 train_time:1520796ms step_avg:231.72ms step:6564/6710 train_time:1521040ms step_avg:231.72ms step:6565/6710 train_time:1521284ms step_avg:231.73ms step:6566/6710 train_time:1521528ms step_avg:231.73ms step:6567/6710 train_time:1521779ms step_avg:231.73ms step:6568/6710 train_time:1522021ms step_avg:231.73ms step:6569/6710 train_time:1522266ms step_avg:231.73ms 
step:6570/6710 train_time:1522508ms step_avg:231.74ms step:6571/6710 train_time:1522753ms step_avg:231.74ms step:6572/6710 train_time:1522995ms step_avg:231.74ms step:6573/6710 train_time:1523241ms step_avg:231.74ms step:6574/6710 train_time:1523485ms step_avg:231.74ms step:6575/6710 train_time:1523732ms step_avg:231.75ms step:6576/6710 train_time:1523976ms step_avg:231.75ms step:6577/6710 train_time:1524218ms step_avg:231.75ms step:6578/6710 train_time:1524462ms step_avg:231.75ms step:6579/6710 train_time:1524707ms step_avg:231.75ms step:6580/6710 train_time:1524951ms step_avg:231.76ms step:6581/6710 train_time:1525196ms step_avg:231.76ms step:6582/6710 train_time:1525440ms step_avg:231.76ms step:6583/6710 train_time:1525684ms step_avg:231.76ms step:6584/6710 train_time:1525929ms step_avg:231.76ms step:6585/6710 train_time:1526170ms step_avg:231.76ms step:6586/6710 train_time:1526413ms step_avg:231.77ms step:6587/6710 train_time:1526656ms step_avg:231.77ms step:6588/6710 train_time:1526903ms step_avg:231.77ms step:6589/6710 train_time:1527145ms step_avg:231.77ms step:6590/6710 train_time:1527394ms step_avg:231.77ms step:6591/6710 train_time:1527639ms step_avg:231.78ms step:6592/6710 train_time:1527883ms step_avg:231.78ms step:6593/6710 train_time:1528127ms step_avg:231.78ms step:6594/6710 train_time:1528372ms step_avg:231.78ms step:6595/6710 train_time:1528616ms step_avg:231.78ms step:6596/6710 train_time:1528860ms step_avg:231.79ms step:6597/6710 train_time:1529106ms step_avg:231.79ms step:6598/6710 train_time:1529347ms step_avg:231.79ms step:6599/6710 train_time:1529594ms step_avg:231.79ms step:6600/6710 train_time:1529834ms step_avg:231.79ms step:6601/6710 train_time:1530079ms step_avg:231.80ms step:6602/6710 train_time:1530324ms step_avg:231.80ms step:6603/6710 train_time:1530569ms step_avg:231.80ms step:6604/6710 train_time:1530820ms step_avg:231.80ms step:6605/6710 train_time:1531062ms step_avg:231.80ms step:6606/6710 train_time:1531305ms step_avg:231.81ms 
step:6607/6710 train_time:1531547ms step_avg:231.81ms step:6608/6710 train_time:1531790ms step_avg:231.81ms step:6609/6710 train_time:1532034ms step_avg:231.81ms step:6610/6710 train_time:1532277ms step_avg:231.81ms step:6611/6710 train_time:1532524ms step_avg:231.81ms step:6612/6710 train_time:1532772ms step_avg:231.82ms step:6613/6710 train_time:1533017ms step_avg:231.82ms step:6614/6710 train_time:1533263ms step_avg:231.82ms step:6615/6710 train_time:1533506ms step_avg:231.82ms step:6616/6710 train_time:1533750ms step_avg:231.82ms step:6617/6710 train_time:1533992ms step_avg:231.83ms step:6618/6710 train_time:1534235ms step_avg:231.83ms step:6619/6710 train_time:1534478ms step_avg:231.83ms step:6620/6710 train_time:1534725ms step_avg:231.83ms step:6621/6710 train_time:1534967ms step_avg:231.83ms step:6622/6710 train_time:1535214ms step_avg:231.84ms step:6623/6710 train_time:1535460ms step_avg:231.84ms step:6624/6710 train_time:1535703ms step_avg:231.84ms step:6625/6710 train_time:1535945ms step_avg:231.84ms step:6625/6710 val_loss:2.920650 train_time:1536143ms step_avg:231.87ms Parameter containing: tensor([1.0000, 1.0000, 0.4025, 1.0000, 0.4559, 1.0000, 0.3513, 1.0000], device='cuda:0', requires_grad=True) 0 [6.707387447357178, 5.707385540008545] 1 [0.47789493203163147, 4.805120944976807] 2 [0.5814921259880066, 2.5591466426849365] 3 [0.6762888431549072, 2.197115421295166] 4 [0.4130380153656006, 1.64419686794281] 5 [0.5872757434844971, 2.094630002975464] 6 [0.5195950865745544, 1.2839306592941284] 7 [0.6595669388771057, 4.000247955322266] 8 [0.4967277944087982, -0.16919419169425964] 9 [0.4853697419166565, 1.105457067489624] 10 [0.6105075478553772, 1.6251214742660522] 11 [0.4611378014087677, 1.6825411319732666] 12 [0.8481631875038147, 4.727644443511963] 13 [0.9057088494300842, 2.4930179119110107] 14 [0.9103259444236755, 0.5738170146942139] 15 [0.8926184773445129, -0.5324099659919739] 0 [12.4159574508667, 18.506893157958984, 25.85569190979004] 1 
[21.728607177734375, 19.33659553527832, 53.601993560791016] 2 [40.53390884399414, 14.700860023498535, 20.980636596679688] 3 [38.09153747558594, 19.648178100585938, 24.831897735595703] 4 [25.021114349365234, 18.68170166015625, 23.54616928100586] 5 [29.43701171875, 17.71674156188965, 27.72314453125] 6 [28.68111801147461, 20.311113357543945, 21.74979591369629] 7 [34.71067810058594, 0.0, 28.742389678955078] 8 [25.997739791870117, 20.129213333129883, 31.786827087402344] 9 [34.43904113769531, 17.600526809692383, 26.52969741821289] 10 [44.559322357177734, 18.91846466064453, 26.27433967590332] 11 [38.40502166748047, 23.237768173217773, 17.07935333251953] 12 [53.98358917236328, 19.635438919067383, 17.663928985595703] 13 [66.7222900390625, 12.961355209350586, 19.037315368652344] 14 [71.66450500488281, 14.947393417358398, 24.692058563232422] 15 [76.85059356689453, 54.28715515136719, 84.43781280517578] step:6626/6710 train_time:1536194ms step_avg:231.84ms step:6627/6710 train_time:1536439ms step_avg:231.85ms step:6628/6710 train_time:1536685ms step_avg:231.85ms step:6629/6710 train_time:1536927ms step_avg:231.85ms step:6630/6710 train_time:1537171ms step_avg:231.85ms step:6631/6710 train_time:1537414ms step_avg:231.85ms step:6632/6710 train_time:1537660ms step_avg:231.85ms step:6633/6710 train_time:1537903ms step_avg:231.86ms step:6634/6710 train_time:1538144ms step_avg:231.86ms step:6635/6710 train_time:1538386ms step_avg:231.86ms step:6636/6710 train_time:1538634ms step_avg:231.86ms step:6637/6710 train_time:1538876ms step_avg:231.86ms step:6638/6710 train_time:1539123ms step_avg:231.87ms step:6639/6710 train_time:1539367ms step_avg:231.87ms step:6640/6710 train_time:1539609ms step_avg:231.87ms step:6641/6710 train_time:1539854ms step_avg:231.87ms step:6642/6710 train_time:1540099ms step_avg:231.87ms step:6643/6710 train_time:1540341ms step_avg:231.87ms step:6644/6710 train_time:1540586ms step_avg:231.88ms step:6645/6710 train_time:1540836ms step_avg:231.88ms step:6646/6710 
train_time:1541086ms step_avg:231.88ms step:6647/6710 train_time:1541328ms step_avg:231.88ms step:6648/6710 train_time:1541575ms step_avg:231.89ms step:6649/6710 train_time:1541827ms step_avg:231.89ms step:6650/6710 train_time:1542073ms step_avg:231.89ms step:6651/6710 train_time:1542317ms step_avg:231.89ms step:6652/6710 train_time:1542558ms step_avg:231.89ms step:6653/6710 train_time:1542808ms step_avg:231.90ms step:6654/6710 train_time:1543051ms step_avg:231.90ms step:6655/6710 train_time:1543292ms step_avg:231.90ms step:6656/6710 train_time:1543537ms step_avg:231.90ms step:6657/6710 train_time:1543789ms step_avg:231.90ms step:6658/6710 train_time:1544031ms step_avg:231.91ms step:6659/6710 train_time:1544277ms step_avg:231.91ms step:6660/6710 train_time:1544520ms step_avg:231.91ms step:6661/6710 train_time:1544764ms step_avg:231.91ms step:6662/6710 train_time:1545008ms step_avg:231.91ms step:6663/6710 train_time:1545257ms step_avg:231.92ms step:6664/6710 train_time:1545499ms step_avg:231.92ms step:6665/6710 train_time:1545742ms step_avg:231.92ms step:6666/6710 train_time:1545985ms step_avg:231.92ms step:6667/6710 train_time:1546233ms step_avg:231.92ms step:6668/6710 train_time:1546478ms step_avg:231.93ms step:6669/6710 train_time:1546720ms step_avg:231.93ms step:6670/6710 train_time:1546962ms step_avg:231.93ms step:6671/6710 train_time:1547209ms step_avg:231.93ms step:6672/6710 train_time:1547456ms step_avg:231.93ms step:6673/6710 train_time:1547700ms step_avg:231.93ms step:6674/6710 train_time:1547944ms step_avg:231.94ms step:6675/6710 train_time:1548190ms step_avg:231.94ms step:6676/6710 train_time:1548438ms step_avg:231.94ms step:6677/6710 train_time:1548678ms step_avg:231.94ms step:6678/6710 train_time:1548923ms step_avg:231.94ms step:6679/6710 train_time:1549169ms step_avg:231.95ms step:6680/6710 train_time:1549413ms step_avg:231.95ms step:6681/6710 train_time:1549657ms step_avg:231.95ms step:6682/6710 train_time:1549900ms step_avg:231.95ms step:6683/6710 
train_time:1550143ms step_avg:231.95ms step:6684/6710 train_time:1550387ms step_avg:231.95ms step:6685/6710 train_time:1550633ms step_avg:231.96ms step:6686/6710 train_time:1550877ms step_avg:231.96ms step:6687/6710 train_time:1551120ms step_avg:231.96ms step:6688/6710 train_time:1551365ms step_avg:231.96ms step:6689/6710 train_time:1551616ms step_avg:231.97ms step:6690/6710 train_time:1551857ms step_avg:231.97ms step:6691/6710 train_time:1552100ms step_avg:231.97ms step:6692/6710 train_time:1552345ms step_avg:231.97ms step:6693/6710 train_time:1552588ms step_avg:231.97ms step:6694/6710 train_time:1552844ms step_avg:231.98ms step:6695/6710 train_time:1553084ms step_avg:231.98ms step:6696/6710 train_time:1553328ms step_avg:231.98ms step:6697/6710 train_time:1553575ms step_avg:231.98ms step:6698/6710 train_time:1553820ms step_avg:231.98ms step:6699/6710 train_time:1554064ms step_avg:231.98ms step:6700/6710 train_time:1554306ms step_avg:231.99ms step:6701/6710 train_time:1554553ms step_avg:231.99ms step:6702/6710 train_time:1554799ms step_avg:231.99ms step:6703/6710 train_time:1555039ms step_avg:231.99ms step:6704/6710 train_time:1555282ms step_avg:231.99ms step:6705/6710 train_time:1555527ms step_avg:232.00ms step:6706/6710 train_time:1555770ms step_avg:232.00ms step:6707/6710 train_time:1556014ms step_avg:232.00ms step:6708/6710 train_time:1556258ms step_avg:232.00ms step:6709/6710 train_time:1556504ms step_avg:232.00ms step:6710/6710 train_time:1556752ms step_avg:232.00ms step:6710/6710 val_loss:2.919423 train_time:1556945ms step_avg:232.03ms Parameter containing: tensor([1.0000, 1.0000, 0.4016, 1.0000, 0.4562, 1.0000, 0.3507, 1.0000], device='cuda:0', requires_grad=True) 0 [6.7038774490356445, 5.703875541687012] 1 [0.477759450674057, 4.798025131225586] 2 [0.5816054940223694, 2.552415609359741] 3 [0.6770597696304321, 2.1910054683685303] 4 [0.4131503701210022, 1.6386264562606812] 5 [0.5847637057304382, 2.088890552520752] 6 [0.518068253993988, 1.2770161628723145] 7 
[0.660163402557373, 3.9944875240325928] 8 [0.4957553446292877, -0.17441272735595703] 9 [0.48536384105682373, 1.101366400718689] 10 [0.6116793155670166, 1.6212794780731201] 11 [0.46183815598487854, 1.6780327558517456] 12 [0.8482258319854736, 4.723046779632568] 13 [0.9057905673980713, 2.490715742111206] 14 [0.9103605151176453, 0.5717687010765076] 15 [0.8926903009414673, -0.5348918437957764] 0 [12.408071517944336, 18.472332000732422, 25.90549087524414] 1 [21.720386505126953, 19.293292999267578, 53.450286865234375] 2 [40.45405578613281, 14.6719970703125, 20.9440975189209] 3 [38.062644958496094, 19.617706298828125, 24.782140731811523] 4 [24.996788024902344, 18.651926040649414, 23.495874404907227] 5 [29.277708053588867, 17.693845748901367, 27.74502944946289] 6 [28.534942626953125, 20.30355453491211, 21.739580154418945] 7 [34.6474609375, 0.0, 28.709619522094727] 8 [25.909074783325195, 20.10503578186035, 31.71550941467285] 9 [34.335227966308594, 17.56568717956543, 26.49164581298828] 10 [44.54132080078125, 18.887948989868164, 26.25318717956543] 11 [38.41272735595703, 23.228961944580078, 17.077192306518555] 12 [53.99139404296875, 19.60881996154785, 17.674339294433594] 13 [66.71878814697266, 12.924132347106934, 19.03748893737793] 14 [71.65132904052734, 14.913959503173828, 24.71126365661621] 15 [76.83695220947266, 54.23273468017578, 84.48335266113281] peak memory allocated: 57971 MiB reserved: 69054 MiB