In [133]:
n = 10
L = 20
num_heads = 4
attn_weight = torch.rand(n, 4, L, L)

In [134]:
num_heads = attn_weight.shape[1]
attn_weight = attn_weight.transpose(0, 1)
attn_weight = attn_weight.transpose(1, 2) # L first
attn_weight = attn_weight.contiguous().view(num_heads, L, -1) # collapse to shape L x N L
attn_weight = n*attn_weight.softmax(-1) # softmax across weights across batch and positions
attn_weight = attn_weight.view(num_heads, L, n, L).transpose(1, 2).transpose(0, 1) # transform back to N x L x L

In [107]:
# attn_weight.sum(-1)

In [108]:
# verify 
# attn_weight.transpose(0, 1).sum(-1).sum(-1)

In [94]:
from torch.nn.functional import _in_projection_packed, linear
import math
import torch.nn as nn
from typing import Optional, Tuple
import torch
from torch import Tensor
from torch.nn.parameter import Parameter
from torch.nn.modules.linear import NonDynamicallyQuantizableLinear

import warnings
from typing import Optional, Tuple

import torch
from torch import Tensor
from torch.nn.init import constant_, xavier_normal_, xavier_uniform_
from torch.nn.parameter import Parameter
import torch.nn.functional as F


def scaled_dot_product_attention(query, key, value, attn_mask=None, dropout_p=0.0, is_causal=False, scale=None) -> torch.Tensor:
    # Efficient implementation equivalent to the following:
    L, S = query.size(-2), key.size(-2)
    scale_factor = 1 / math.sqrt(query.size(-1)) if scale is None else scale
    attn_bias = torch.zeros(L, S, dtype=query.dtype)
    device = query.device
    attn_bias = attn_bias.to(device)
    if is_causal:
        assert attn_mask is None
        temp_mask = torch.ones(L, S, dtype=torch.bool).tril(diagonal=0)
        attn_bias.masked_fill_(temp_mask.logical_not(), float("-inf"))
        attn_bias.to(query.dtype)

    if attn_mask is not None:
        if attn_mask.dtype == torch.bool:
            attn_mask.masked_fill_(attn_mask.logical_not(), float("-inf"))
        else:
            attn_bias += attn_mask
    attn_weight = query @ key.transpose(-2, -1) * scale_factor
    attn_weight += attn_bias
    # attn_weight = torch.softmax(attn_weight, dim=-1)
    # attn_weight = torch.exp(attn_weight)/torch.exp(attn_weight).sum()
    attn_weight = torch.sigmoid(attn_weight)
    attn_weight_ = torch.dropout(attn_weight, dropout_p, train=True)
    return attn_weight_ @ value, attn_weight


def multi_head_attention_forward(
    query: Tensor,
    key: Tensor,
    value: Tensor,
    embed_dim_to_check: int,
    num_heads: int,
    in_proj_weight: Optional[Tensor],
    in_proj_bias: Optional[Tensor],
    bias_k: Optional[Tensor],
    bias_v: Optional[Tensor],
    add_zero_attn: bool,
    dropout_p: float,
    out_proj_weight: Tensor,
    out_proj_bias: Optional[Tensor],
    training: bool = True,
    key_padding_mask: Optional[Tensor] = None,
    need_weights: bool = True,
    attn_mask: Optional[Tensor] = None,
    use_separate_proj_weight: bool = False,
    q_proj_weight: Optional[Tensor] = None,
    k_proj_weight: Optional[Tensor] = None,
    v_proj_weight: Optional[Tensor] = None,
    static_k: Optional[Tensor] = None,
    static_v: Optional[Tensor] = None,
    average_attn_weights: bool = True,
    is_causal: bool = False,
) -> Tuple[Tensor, Optional[Tensor]]:


    # set up shape vars
    tgt_len, bsz, embed_dim = query.shape
    src_len, _, _ = key.shape

    if isinstance(embed_dim, torch.Tensor):
        # embed_dim can be a tensor when JIT tracing
        head_dim = embed_dim.div(num_heads, rounding_mode='trunc')
    else:
        head_dim = embed_dim // num_heads
    assert head_dim * num_heads == embed_dim, f"embed_dim {embed_dim} not divisible by num_heads {num_heads}"
    if use_separate_proj_weight:
        # allow MHA to have different embedding dimensions when separate projection weights are used
        assert key.shape[:2] == value.shape[:2], \
            f"key's sequence and batch dims {key.shape[:2]} do not match value's {value.shape[:2]}"
    else:
        assert key.shape == value.shape, f"key shape {key.shape} does not match value shape {value.shape}"

    #
    # compute in-projection
    #
    if not use_separate_proj_weight:
        assert in_proj_weight is not None, "use_separate_proj_weight is False but in_proj_weight is None"
        q, k, v = _in_projection_packed(query, key, value, in_proj_weight, in_proj_bias)
    else:
        assert q_proj_weight is not None, "use_separate_proj_weight is True but q_proj_weight is None"
        assert k_proj_weight is not None, "use_separate_proj_weight is True but k_proj_weight is None"
        assert v_proj_weight is not None, "use_separate_proj_weight is True but v_proj_weight is None"
        if in_proj_bias is None:
            b_q = b_k = b_v = None
        else:
            b_q, b_k, b_v = in_proj_bias.chunk(3)
        q, k, v = _in_projection(query, key, value, q_proj_weight, k_proj_weight, v_proj_weight, b_q, b_k, b_v)


    # add bias along batch dimension (currently second)
    if bias_k is not None and bias_v is not None:
        assert static_k is None, "bias cannot be added to static key."
        assert static_v is None, "bias cannot be added to static value."
        k = torch.cat([k, bias_k.repeat(1, bsz, 1)])
        v = torch.cat([v, bias_v.repeat(1, bsz, 1)])
        if attn_mask is not None:
            attn_mask = pad(attn_mask, (0, 1))
        if key_padding_mask is not None:
            key_padding_mask = pad(key_padding_mask, (0, 1))
    else:
        assert bias_k is None
        assert bias_v is None

    #
    # reshape q, k, v for multihead attention and make em batch first
    #
    q = q.view(tgt_len, bsz * num_heads, head_dim).transpose(0, 1)
    if static_k is None:
        k = k.view(k.shape[0], bsz * num_heads, head_dim).transpose(0, 1)
    else:
        # TODO finish disentangling control flow so we don't do in-projections when statics are passed
        assert static_k.size(0) == bsz * num_heads, \
            f"expecting static_k.size(0) of {bsz * num_heads}, but got {static_k.size(0)}"
        assert static_k.size(2) == head_dim, \
            f"expecting static_k.size(2) of {head_dim}, but got {static_k.size(2)}"
        k = static_k
    if static_v is None:
        v = v.view(v.shape[0], bsz * num_heads, head_dim).transpose(0, 1)
    else:
        # TODO finish disentangling control flow so we don't do in-projections when statics are passed
        assert static_v.size(0) == bsz * num_heads, \
            f"expecting static_v.size(0) of {bsz * num_heads}, but got {static_v.size(0)}"
        assert static_v.size(2) == head_dim, \
            f"expecting static_v.size(2) of {head_dim}, but got {static_v.size(2)}"
        v = static_v

    # add zero attention along batch dimension (now first)
    if add_zero_attn:
        zero_attn_shape = (bsz * num_heads, 1, head_dim)
        k = torch.cat([k, torch.zeros(zero_attn_shape, dtype=k.dtype, device=k.device)], dim=1)
        v = torch.cat([v, torch.zeros(zero_attn_shape, dtype=v.dtype, device=v.device)], dim=1)
        if attn_mask is not None:
            attn_mask = pad(attn_mask, (0, 1))
        if key_padding_mask is not None:
            key_padding_mask = pad(key_padding_mask, (0, 1))

    # update source sequence length after adjustments
    src_len = k.size(1)

    # adjust dropout probability
    if not training:
        dropout_p = 0.0

    #
    # (deep breath) calculate attention and out projection
    #


    q = q.view(bsz, num_heads, tgt_len, head_dim)
    k = k.view(bsz, num_heads, src_len, head_dim)
    v = v.view(bsz, num_heads, src_len, head_dim)

    attn_output, attn_weights = scaled_dot_product_attention(q, k, v, attn_mask, dropout_p, is_causal)
    attn_output = attn_output.permute(2, 0, 1, 3).contiguous().view(bsz * tgt_len, embed_dim)

    attn_output = linear(attn_output, out_proj_weight, out_proj_bias)
    attn_output = attn_output.view(tgt_len, bsz, attn_output.size(1))
    # if not is_batched:
    #     # squeeze the output if input was unbatched
    #     attn_output = attn_output.squeeze(1)
    return attn_output, attn_weights


class MultiheadAttention(nn.Module):
    r"""Allows the model to jointly attend to information
    from different representation subspaces as described in the paper:
    `Attention Is All You Need <https://arxiv.org/abs/1706.03762>`_.

    Multi-Head Attention is defined as:

    .. math::
        \text{MultiHead}(Q, K, V) = \text{Concat}(head_1,\dots,head_h)W^O

    where :math:`head_i = \text{Attention}(QW_i^Q, KW_i^K, VW_i^V)`.

    ``nn.MultiHeadAttention`` will use the optimized implementations of
    ``scaled_dot_product_attention()`` when possible.

    In addition to support for the new ``scaled_dot_product_attention()``
    function, for speeding up Inference, MHA will use
    fastpath inference with support for Nested Tensors, iff:

    - self attention is being computed (i.e., ``query``, ``key``, and ``value`` are the same tensor).
    - inputs are batched (3D) with ``batch_first==True``
    - Either autograd is disabled (using ``torch.inference_mode`` or ``torch.no_grad``) or no tensor argument ``requires_grad``
    - training is disabled (using ``.eval()``)
    - ``add_bias_kv`` is ``False``
    - ``add_zero_attn`` is ``False``
    - ``batch_first`` is ``True`` and the input is batched
    - ``kdim`` and ``vdim`` are equal to ``embed_dim``
    - if a `NestedTensor <https://pytorch.org/docs/stable/nested.html>`_ is passed, neither ``key_padding_mask``
      nor ``attn_mask`` is passed
    - autocast is disabled

    If the optimized inference fastpath implementation is in use, a
    `NestedTensor <https://pytorch.org/docs/stable/nested.html>`_ can be passed for
    ``query``/``key``/``value`` to represent padding more efficiently than using a
    padding mask. In this case, a `NestedTensor <https://pytorch.org/docs/stable/nested.html>`_
    will be returned, and an additional speedup proportional to the fraction of the input
    that is padding can be expected.

    Args:
        embed_dim: Total dimension of the model.
        num_heads: Number of parallel attention heads. Note that ``embed_dim`` will be split
            across ``num_heads`` (i.e. each head will have dimension ``embed_dim // num_heads``).
        dropout: Dropout probability on ``attn_output_weights``. Default: ``0.0`` (no dropout).
        bias: If specified, adds bias to input / output projection layers. Default: ``True``.
        add_bias_kv: If specified, adds bias to the key and value sequences at dim=0. Default: ``False``.
        add_zero_attn: If specified, adds a new batch of zeros to the key and value sequences at dim=1.
            Default: ``False``.
        kdim: Total number of features for keys. Default: ``None`` (uses ``kdim=embed_dim``).
        vdim: Total number of features for values. Default: ``None`` (uses ``vdim=embed_dim``).
        batch_first: If ``True``, then the input and output tensors are provided
            as (batch, seq, feature). Default: ``False`` (seq, batch, feature).

    Examples::

        >>> # xdoctest: +SKIP
        >>> multihead_attn = nn.MultiheadAttention(embed_dim, num_heads)
        >>> attn_output, attn_output_weights = multihead_attn(query, key, value)

    .. _`FlashAttention: Fast and Memory-Efficient Exact Attention with IO-Awareness`:
         https://arxiv.org/abs/2205.14135

    """

    __constants__ = ['batch_first']
    bias_k: Optional[torch.Tensor]
    bias_v: Optional[torch.Tensor]

    def __init__(self, embed_dim, num_heads, dropout=0., bias=True, add_bias_kv=False, add_zero_attn=False,
                 kdim=None, vdim=None, batch_first=False, device=None, dtype=None) -> None:
        if embed_dim <= 0 or num_heads <= 0:
            raise ValueError(
                f"embed_dim and num_heads must be greater than 0,"
                f" got embed_dim={embed_dim} and num_heads={num_heads} instead"
            )
        factory_kwargs = {'device': device, 'dtype': dtype}
        super().__init__()
        self.embed_dim = embed_dim
        self.kdim = kdim if kdim is not None else embed_dim
        self.vdim = vdim if vdim is not None else embed_dim
        self._qkv_same_embed_dim = self.kdim == embed_dim and self.vdim == embed_dim

        self.num_heads = num_heads
        self.dropout = dropout
        self.batch_first = batch_first
        self.head_dim = embed_dim // num_heads
        assert self.head_dim * num_heads == self.embed_dim, "embed_dim must be divisible by num_heads"

        if not self._qkv_same_embed_dim:
            self.q_proj_weight = Parameter(torch.empty((embed_dim, embed_dim), **factory_kwargs))
            self.k_proj_weight = Parameter(torch.empty((embed_dim, self.kdim), **factory_kwargs))
            self.v_proj_weight = Parameter(torch.empty((embed_dim, self.vdim), **factory_kwargs))
            self.register_parameter('in_proj_weight', None)
        else:
            self.in_proj_weight = Parameter(torch.empty((3 * embed_dim, embed_dim), **factory_kwargs))
            self.register_parameter('q_proj_weight', None)
            self.register_parameter('k_proj_weight', None)
            self.register_parameter('v_proj_weight', None)

        if bias:
            self.in_proj_bias = Parameter(torch.empty(3 * embed_dim, **factory_kwargs))
        else:
            self.register_parameter('in_proj_bias', None)
        self.out_proj = NonDynamicallyQuantizableLinear(embed_dim, embed_dim, bias=bias, **factory_kwargs)

        if add_bias_kv:
            self.bias_k = Parameter(torch.empty((1, 1, embed_dim), **factory_kwargs))
            self.bias_v = Parameter(torch.empty((1, 1, embed_dim), **factory_kwargs))
        else:
            self.bias_k = self.bias_v = None

        self.add_zero_attn = add_zero_attn

        self._reset_parameters()

    def _reset_parameters(self):
        if self._qkv_same_embed_dim:
            xavier_uniform_(self.in_proj_weight)
        else:
            xavier_uniform_(self.q_proj_weight)
            xavier_uniform_(self.k_proj_weight)
            xavier_uniform_(self.v_proj_weight)

        if self.in_proj_bias is not None:
            constant_(self.in_proj_bias, 0.)
            constant_(self.out_proj.bias, 0.)
        if self.bias_k is not None:
            xavier_normal_(self.bias_k)
        if self.bias_v is not None:
            xavier_normal_(self.bias_v)

    def __setstate__(self, state):
        # Support loading old MultiheadAttention checkpoints generated by v1.1.0
        if '_qkv_same_embed_dim' not in state:
            state['_qkv_same_embed_dim'] = True

        super().__setstate__(state)

    def forward(
        self,
        query: Tensor,
        key: Tensor,
        value: Tensor,
        key_padding_mask: Optional[Tensor] = None,
        need_weights: bool = True,
        attn_mask: Optional[Tensor] = None,
        average_attn_weights: bool = True,
        is_causal : bool = False) -> Tuple[Tensor, Optional[Tensor]]:
        r"""
    Args:
        query: Query embeddings of shape :math:`(L, E_q)` for unbatched input, :math:`(L, N, E_q)` when ``batch_first=False``
            or :math:`(N, L, E_q)` when ``batch_first=True``, where :math:`L` is the target sequence length,
            :math:`N` is the batch size, and :math:`E_q` is the query embedding dimension ``embed_dim``.
            Queries are compared against key-value pairs to produce the output.
            See "Attention Is All You Need" for more details.
        key: Key embeddings of shape :math:`(S, E_k)` for unbatched input, :math:`(S, N, E_k)` when ``batch_first=False``
            or :math:`(N, S, E_k)` when ``batch_first=True``, where :math:`S` is the source sequence length,
            :math:`N` is the batch size, and :math:`E_k` is the key embedding dimension ``kdim``.
            See "Attention Is All You Need" for more details.
        value: Value embeddings of shape :math:`(S, E_v)` for unbatched input, :math:`(S, N, E_v)` when
            ``batch_first=False`` or :math:`(N, S, E_v)` when ``batch_first=True``, where :math:`S` is the source
            sequence length, :math:`N` is the batch size, and :math:`E_v` is the value embedding dimension ``vdim``.
            See "Attention Is All You Need" for more details.
        key_padding_mask: If specified, a mask of shape :math:`(N, S)` indicating which elements within ``key``
            to ignore for the purpose of attention (i.e. treat as "padding"). For unbatched `query`, shape should be :math:`(S)`.
            Binary and float masks are supported.
            For a binary mask, a ``True`` value indicates that the corresponding ``key`` value will be ignored for
            the purpose of attention. For a float mask, it will be directly added to the corresponding ``key`` value.
        need_weights: If specified, returns ``attn_output_weights`` in addition to ``attn_outputs``.
            Set ``need_weights=False`` to use the optimized ``scaled_dot_product_attention``
            and achieve the best performance for MHA.
            Default: ``True``.
        attn_mask: If specified, a 2D or 3D mask preventing attention to certain positions. Must be of shape
            :math:`(L, S)` or :math:`(N\cdot\text{num\_heads}, L, S)`, where :math:`N` is the batch size,
            :math:`L` is the target sequence length, and :math:`S` is the source sequence length. A 2D mask will be
            broadcasted across the batch while a 3D mask allows for a different mask for each entry in the batch.
            Binary and float masks are supported. For a binary mask, a ``True`` value indicates that the
            corresponding position is not allowed to attend. For a float mask, the mask values will be added to
            the attention weight.
            If both attn_mask and key_padding_mask are supplied, their types should match.
        average_attn_weights: If true, indicates that the returned ``attn_weights`` should be averaged across
            heads. Otherwise, ``attn_weights`` are provided separately per head. Note that this flag only has an
            effect when ``need_weights=True``. Default: ``True`` (i.e. average weights across heads)
        is_causal: If specified, applies a causal mask as attention mask.
            Default: ``False``.
            Warning:
            ``is_causal`` provides a hint that ``attn_mask`` is the
            causal mask. Providing incorrect hints can result in
            incorrect execution, including forward and backward
            compatibility.

    Outputs:
        - **attn_output** - Attention outputs of shape :math:`(L, E)` when input is unbatched,
          :math:`(L, N, E)` when ``batch_first=False`` or :math:`(N, L, E)` when ``batch_first=True``,
          where :math:`L` is the target sequence length, :math:`N` is the batch size, and :math:`E` is the
          embedding dimension ``embed_dim``.
        - **attn_output_weights** - Only returned when ``need_weights=True``. If ``average_attn_weights=True``,
          returns attention weights averaged across heads of shape :math:`(L, S)` when input is unbatched or
          :math:`(N, L, S)`, where :math:`N` is the batch size, :math:`L` is the target sequence length, and
          :math:`S` is the source sequence length. If ``average_attn_weights=False``, returns attention weights per
          head of shape :math:`(\text{num\_heads}, L, S)` when input is unbatched or :math:`(N, \text{num\_heads}, L, S)`.

        .. note::
            `batch_first` argument is ignored for unbatched inputs.
        """

        why_not_fast_path = ''
        if ((attn_mask is not None and torch.is_floating_point(attn_mask))
           or (key_padding_mask is not None) and torch.is_floating_point(key_padding_mask)):
            why_not_fast_path = "floating-point masks are not supported for fast path."

        is_batched = query.dim() == 3

        key_padding_mask = F._canonical_mask(
            mask=key_padding_mask,
            mask_name="key_padding_mask",
            other_type=F._none_or_dtype(attn_mask),
            other_name="attn_mask",
            target_type=query.dtype
        )

        attn_mask = F._canonical_mask(
            mask=attn_mask,
            mask_name="attn_mask",
            other_type=None,
            other_name="",
            target_type=query.dtype,
            check_other=False,
        )


        if not is_batched:
            why_not_fast_path = f"input not batched; expected query.dim() of 3 but got {query.dim()}"
        elif query is not key or key is not value:
            # When lifting this restriction, don't forget to either
            # enforce that the dtypes all match or test cases where
            # they don't!
            why_not_fast_path = "non-self attention was used (query, key, and value are not the same Tensor)"
        elif self.in_proj_bias is not None and query.dtype != self.in_proj_bias.dtype:
            why_not_fast_path = f"dtypes of query ({query.dtype}) and self.in_proj_bias ({self.in_proj_bias.dtype}) don't match"
        elif self.in_proj_weight is None:
            why_not_fast_path = "in_proj_weight was None"
        elif query.dtype != self.in_proj_weight.dtype:
            # this case will fail anyway, but at least they'll get a useful error message.
            why_not_fast_path = f"dtypes of query ({query.dtype}) and self.in_proj_weight ({self.in_proj_weight.dtype}) don't match"
        elif self.training:
            why_not_fast_path = "training is enabled"
        elif (self.num_heads % 2) != 0:
            why_not_fast_path = "self.num_heads is not even"
        elif not self.batch_first:
            why_not_fast_path = "batch_first was not True"
        elif self.bias_k is not None:
            why_not_fast_path = "self.bias_k was not None"
        elif self.bias_v is not None:
            why_not_fast_path = "self.bias_v was not None"
        elif self.add_zero_attn:
            why_not_fast_path = "add_zero_attn was enabled"
        elif not self._qkv_same_embed_dim:
            why_not_fast_path = "_qkv_same_embed_dim was not True"
        elif query.is_nested and (key_padding_mask is not None or attn_mask is not None):
            why_not_fast_path = "supplying both src_key_padding_mask and src_mask at the same time \
                                 is not supported with NestedTensor input"
        elif torch.is_autocast_enabled():
            why_not_fast_path = "autocast is enabled"

        if not why_not_fast_path:
            tensor_args = (
                query,
                key,
                value,
                self.in_proj_weight,
                self.in_proj_bias,
                self.out_proj.weight,
                self.out_proj.bias,
            )
            # We have to use list comprehensions below because TorchScript does not support
            # generator expressions.
            if torch.overrides.has_torch_function(tensor_args):
                why_not_fast_path = "some Tensor argument has_torch_function"
            elif _is_make_fx_tracing():
                why_not_fast_path = "we are running make_fx tracing"
            elif not all(_check_arg_device(x) for x in tensor_args):
                why_not_fast_path = ("some Tensor argument's device is neither one of "
                                     f"cpu, cuda or {torch.utils.backend_registration._privateuse1_backend_name}")
            elif torch.is_grad_enabled() and any(_arg_requires_grad(x) for x in tensor_args):
                why_not_fast_path = ("grad is enabled and at least one of query or the "
                                     "input/output projection weights or biases requires_grad")
            if not why_not_fast_path:
                merged_mask, mask_type = self.merge_masks(attn_mask, key_padding_mask, query)

                if self.in_proj_bias is not None and self.in_proj_weight is not None:
                    return torch._native_multi_head_attention(
                        query,
                        key,
                        value,
                        self.embed_dim,
                        self.num_heads,
                        self.in_proj_weight,
                        self.in_proj_bias,
                        self.out_proj.weight,
                        self.out_proj.bias,
                        merged_mask,
                        need_weights,
                        average_attn_weights,
                        mask_type)

        any_nested = query.is_nested or key.is_nested or value.is_nested
        assert not any_nested, ("MultiheadAttention does not support NestedTensor outside of its fast path. " +
                                f"The fast path was not hit because {why_not_fast_path}")

        if self.batch_first and is_batched:
            # make sure that the transpose op does not affect the "is" property
            if key is value:
                if query is key:
                    query = key = value = query.transpose(1, 0)
                else:
                    query, key = (x.transpose(1, 0) for x in (query, key))
                    value = key
            else:
                query, key, value = (x.transpose(1, 0) for x in (query, key, value))

        if not self._qkv_same_embed_dim:
            attn_output, attn_output_weights = multi_head_attention_forward(
                query, key, value, self.embed_dim, self.num_heads,
                self.in_proj_weight, self.in_proj_bias,
                self.bias_k, self.bias_v, self.add_zero_attn,
                self.dropout, self.out_proj.weight, self.out_proj.bias,
                training=self.training,
                key_padding_mask=key_padding_mask, need_weights=need_weights,
                attn_mask=attn_mask,
                use_separate_proj_weight=True,
                q_proj_weight=self.q_proj_weight, k_proj_weight=self.k_proj_weight,
                v_proj_weight=self.v_proj_weight,
                average_attn_weights=average_attn_weights,
                is_causal=is_causal)
        else:
            attn_output, attn_output_weights = multi_head_attention_forward(
                query, key, value, self.embed_dim, self.num_heads,
                self.in_proj_weight, self.in_proj_bias,
                self.bias_k, self.bias_v, self.add_zero_attn,
                self.dropout, self.out_proj.weight, self.out_proj.bias,
                training=self.training,
                key_padding_mask=key_padding_mask,
                need_weights=need_weights,
                attn_mask=attn_mask,
                average_attn_weights=average_attn_weights,
                is_causal=is_causal)
        if self.batch_first and is_batched:
            return attn_output.transpose(1, 0), attn_output_weights
        else:
            return attn_output, attn_output_weights


In [150]:
def scaled_dot_product_attention(query, key, value, attn_mask=None, dropout_p=0.0, is_causal=False, scale=None) -> torch.Tensor:
    # Efficient implementation equivalent to the following:
    L, S = query.size(-2), key.size(-2)
    n = query.size(0)
    scale_factor = 1 / math.sqrt(query.size(-1)) if scale is None else scale
    attn_bias = torch.zeros(L, S, dtype=query.dtype)
    device = query.device
    attn_bias = attn_bias.to(device)
    if is_causal:
        assert attn_mask is None
        temp_mask = torch.ones(L, S, dtype=torch.bool).tril(diagonal=0)
        attn_bias.masked_fill_(temp_mask.logical_not(), float("-inf"))
        attn_bias.to(query.dtype)

    if attn_mask is not None:
        if attn_mask.dtype == torch.bool:
            attn_mask.masked_fill_(attn_mask.logical_not(), float("-inf"))
        else:
            attn_bias += attn_mask

    attn_weight = query @ key.transpose(-2, -1) * scale_factor
    num_heads = attn_weight.shape[1]
    attn_weight = attn_weight.transpose(0, 1)
    attn_weight = attn_weight.transpose(1, 2) # L first
    attn_weight = attn_weight.contiguous().view(num_heads, L, -1) # collapse to shape L x N L
    attn_weight = n*attn_weight.softmax(-1) # softmax across weights across batch and positions
    attn_weight = attn_weight.view(num_heads, L, n, L).transpose(1, 2).transpose(0, 1) # transform back to N x L x L
    attn_weight_ = torch.dropout(attn_weight, dropout_p, train=True)
    return attn_weight_ @ value, attn_weight


In [137]:
n = 10
L = 40
D = 128
x = torch.rand(num_heads, n, L, D)
scaled_dot_product_attention(x, x, x)[0].shape

torch.Size([4, 10, 40, 40])


torch.Size([4, 10, 40, 128])

In [138]:
# test 
num_heads, dropout_p = 2, .1

mha = MultiheadAttention(embed_dim, num_heads, dropout=dropout_p, bias=True, add_bias_kv=False, add_zero_attn=False,
                 kdim=None, vdim=None, batch_first=False, device=device, dtype=None).to(device)

L = 10
n = 5
D = 128
x = torch.rand(L, n, D).to(device)

out, weights = mha(x, x, x, need_weights=True)

weights.sum(-1).flatten()

torch.Size([5, 2, 10, 10])


tensor([1.1531, 0.9863, 1.1001, 1.0117, 1.1051, 0.9483, 1.1189, 1.1657, 1.0410,
        1.0744, 1.0411, 0.9645, 0.9881, 0.9368, 1.0203, 0.9912, 0.9957, 1.0634,
        0.9984, 1.0368, 0.9745, 0.9968, 1.0079, 0.9595, 0.9643, 1.0874, 0.9588,
        0.9748, 0.9923, 1.0477, 0.9562, 1.0124, 0.9835, 1.0314, 1.0655, 1.0447,
        1.0406, 0.9578, 0.9914, 0.9623, 1.0062, 1.0006, 0.9162, 1.0456, 0.9138,
        0.9792, 0.8846, 1.0494, 0.8506, 0.8630, 0.9526, 1.1002, 0.9899, 1.0096,
        0.9618, 0.9983, 0.9870, 0.9719, 1.0035, 1.0174, 0.8713, 0.9887, 0.9870,
        1.0040, 1.0764, 0.9631, 0.9731, 0.8595, 1.0116, 0.9554, 1.0385, 1.0430,
        1.0392, 1.0137, 0.9921, 0.9667, 0.9985, 1.0385, 1.1281, 1.0429, 0.9949,
        1.0276, 0.9888, 0.9792, 0.9405, 1.0220, 1.0646, 0.9507, 1.1044, 1.0594,
        1.0115, 0.8798, 0.9993, 1.0085, 0.9602, 0.9991, 0.9783, 0.9684, 0.8786,
        0.9406], device='cuda:0', grad_fn=<ReshapeAliasBackward0>)

In [141]:
q, k, v = torch.rand(5, L, hidden_dim), torch.rand(5, L, hidden_dim), torch.rand(5, L, hidden_dim)
q, k, v = q.to(device), k.to(device), v.to(device)

NameError: name 'hidden_dim' is not defined

### Build Transformer

In [142]:
class Transformer_torch_MHA(nn.Module):
    def __init__(self, input_dim, hidden_dim, num_layers, num_heads, dropout_p):
        super(Transformer_torch_MHA, self).__init__()

        self.embedding = nn.Embedding(input_dim, hidden_dim)
                
        self.transformer_layers = nn.ModuleList([
            MultiheadAttention(hidden_dim, num_heads, dropout=dropout_p)
            for _ in range(num_layers)
        ])
        self.fc = nn.Linear(hidden_dim*L, 1)        
        self.sigmoid_norm = nn.BatchNorm1d(1, affine=False)        
        self.sigmoid = nn.Sigmoid()
        self.phi_scaling = nn.Linear(1, 1)
        self.sigmoid_scaling = nn.Linear(1, 1)

    def forward(self, x):

        x = self.embedding(x)
        x = x.permute(1, 0, 2)  # seq_len x batch x hidden_dim
        

        for layer in self.transformer_layers:
            x, _ = layer(x, x, x)
            
        x = x.permute(1, 0, 2)
        x = x.flatten(1)
        x = self.fc(x)  # batch x 1 (scalar)
        x = self.sigmoid_norm(x)
        x = self.sigmoid(x)
        x = self.sigmoid_scaling(x)

        return x

### Read data

In [151]:
## Standard libraries
import os
import numpy as np
import math
import json
from functools import partial

import random as rd

import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import torch
import GPUtil
import torch
import torch.nn as nn
import sys
sys.path.append('../model')
from utils import amino_acid_to_number, tokenize

device = "cuda:0"

# site specific tokenization

def get_A2N_list(seqs):
    seqs_ = list([list(seq) for seq in seqs])
    seqs__ = pd.DataFrame(seqs_)
    alphabet_by_site = [list(seqs__.iloc[:, i].unique()) for i in range(seqs__.shape[1])]
    A2N_list = [dict(zip(alphabet, range(len(alphabet)))) for alphabet in alphabet_by_site]        
    return A2N_list

def tokenize(seq):
    numeric_sequence = [A2N_list[i][seq[i]] for i in range(len(A2N_list))]
    return numeric_sequence


In [152]:
in_path = "../Data/Data_prepared/"
file_name = "Faure2023_1_lenient.csv"
datafile = pd.read_csv(in_path + file_name, index_col=None)

phenotypes = torch.tensor(list(datafile.DMS_score)).float()
phenotypes = phenotypes.unsqueeze(1)

#### Generate tokenized sequences 

A2N_list = get_A2N_list(datafile.mutated_sequence) # Get position-wise alphabet
seqs = [tokenize(mutant) for mutant in datafile.mutated_sequence]
seqs = torch.tensor(seqs)

seqs_df = pd.DataFrame(seqs.cpu().numpy())
counts = {i: seqs_df[i].value_counts() for i in range(seqs_df.shape[1])}
n_aas = [len(counts[i]) for i in range(len(counts))]
sites_var = np.where(np.array(n_aas) != 1)

seqs = seqs[:, sites_var].squeeze(1)
L = seqs.shape[1]
print(f"sequence length = {L}")

#### Generate one hot sequences

from torch.nn.functional import one_hot
seqs1h = one_hot(seqs)

AA_size = seqs1h.shape[-1]

seqs1hf = seqs1h.view(-1, L*(AA_size))

sequence length = 34


In [153]:
#### Define train test scheme
import torch
import torch.utils.data as data

class ProtDataset(data.Dataset):
    def __init__(self, feats, labels, train=True):    
        self.train = train
        self.feats = feats
        self.labels = labels
    
    def __len__(self):
        return len(self.feats)
    
    def __getitem__(self, idx):
        
        X = self.feats[idx]
        y = self.labels[idx]
        
        return X, y

# random sampling

num_train = 20000
num_test = 2000

sub_list = np.random.choice(range(len(datafile)), num_train, replace=False)
comp_list = list(set(range(len(datafile))).difference(sub_list))

train_list = sub_list
test_list = np.random.choice(comp_list, num_test, replace=False)

In [154]:
AA_size = seqs1h.shape[-1]
seqs_ex = seqs + AA_size*torch.tensor(range(L))

X = seqs_ex.to(device)
y = phenotypes.to(device)
X_train, y_train = X[train_list], y[train_list]
X_test, y_test = X[test_list], y[test_list]
train_dataset = ProtDataset(X_train, y_train)

batch_size = 1000

train_loader = data.DataLoader(train_dataset,
                               batch_size=batch_size,
                               shuffle=True,
                               drop_last=False)

### Test model

In [155]:
import numpy as np
import torch
import torch.nn as nn
import torch.optim as optim
from sklearn.datasets import load_digits
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score

In [156]:
sequence_length = L
input_dim = AA_size*L
output_dim = 1
hidden_dim = 128
num_layers = 2
num_heads = 4
dropout = 0.3

model = Transformer_torch_MHA(input_dim, hidden_dim, num_layers, num_heads, dropout).to(device)

In [None]:
#[I 2024-01-21 09:46:50,476] Trial 99 finished with value: 0.7394443620941293 and parameters: {'hidden_dim_h': 18, 'dropout': 0.1657532538257177, 'batch_size': 531}. Best is trial 94 with value: 0.7601027427382819.


In [157]:
from scipy.stats import pearsonr
learning_rate = 0.001
epochs = 500

criterion = nn.MSELoss()
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

for epoch in range(epochs):
    model.train()
    total_loss = 0
    for batch_inputs, batch_targets in train_loader:
        optimizer.zero_grad()
        outputs = model(batch_inputs)
        loss = criterion(outputs, batch_targets)
        loss.backward()
        optimizer.step()
        total_loss += loss.item()
    
    if epoch % 1 == 0:
        print(f"Epoch {epoch+1}/{epochs}, Loss: {total_loss/len(train_loader)}")
        model.eval()
        pred, true = model(X_test.flatten(1)).flatten().detach().cpu().numpy(), y_test.flatten().detach().cpu().numpy()
        print(pearsonr(pred, true)[0]**2)

Epoch 1/500, Loss: 3.3160937309265135
0.48475288749033707
Epoch 2/500, Loss: 3.179739212989807
0.43134127615174056
Epoch 3/500, Loss: 3.069993495941162
0.5002596872791077
Epoch 4/500, Loss: 2.9723472476005552
0.4941023589733627
Epoch 5/500, Loss: 2.8776196241378784
0.509260613066335
Epoch 6/500, Loss: 2.7858458757400513
0.5001161398956125
Epoch 7/500, Loss: 2.6965011239051817
0.49685887761221864
Epoch 8/500, Loss: 2.609458565711975
0.5200041287813876
Epoch 9/500, Loss: 2.5257091164588927
0.5171834148894329
Epoch 10/500, Loss: 2.4429805755615233
0.5114417255188676
Epoch 11/500, Loss: 2.362980580329895
0.5410297489023641
Epoch 12/500, Loss: 2.28524044752121
0.5466060222684824
Epoch 13/500, Loss: 2.2095708727836607
0.5381723222980382
Epoch 14/500, Loss: 2.136424744129181
0.5220662354695637
Epoch 15/500, Loss: 2.0653161346912383
0.5399143844797315
Epoch 16/500, Loss: 1.9964780747890472
0.5583277894518711
Epoch 17/500, Loss: 1.929161822795868
0.5389737662733907
Epoch 18/500, Loss: 1.8643155

KeyboardInterrupt: 

### Optuna

#### 2 layers softmax

In [111]:
import optuna
from scipy.stats import pearsonr
learning_rate = 0.001
epochs = 200
num_heads = 4
num_layers = 2
sequence_length = L
input_dim = AA_size*L
output_dim = 1
dropout_init = 0.3
batch_size_init = 1000
hidden_dim_h_init = 32

def objective(trial):
    # Define the hyperparameters to be optimized
    # hidden_dim_h = trial.suggest_int('hidden_dim_h', hidden_dim_h_init, 10, 50)
    # dropout = trial.suggest_float('dropout', dropout_init, 0.05, 0.35)
    # batch_size = trial.suggest_int('batch_size', batch_size_init, 100, 1200)

    hidden_dim_h = trial.suggest_int('hidden_dim_h', 10, 50)
    dropout = trial.suggest_float('dropout', 0.05, 0.35)
    batch_size = trial.suggest_int('batch_size', 100, 1200)
    
    model = Transformer_torch_MHA(input_dim, hidden_dim_h*num_heads, num_layers, num_heads, dropout).to(device)
    
    train_loader = data.DataLoader(train_dataset,
                                   batch_size=batch_size,
                                   shuffle=True,
                                   drop_last=False)
    criterion = nn.MSELoss()
    optimizer = optim.Adam(model.parameters(), lr=learning_rate)

    r2_test = []
    try: 
        for epoch in range(epochs):

                model.train()
                total_loss = 0
                for batch_inputs, batch_targets in train_loader:
                    optimizer.zero_grad()
                    outputs = model(batch_inputs)
                    loss = criterion(outputs, batch_targets)
                    loss.backward()
                    optimizer.step()
                    total_loss += loss.item()

                if epoch % 10 == 0:
                    print(f"Epoch {epoch+1}/{epochs}, Loss: {total_loss/len(train_loader)}")
                    model.eval()
                    pred, true = model(X_test.flatten(1)).flatten().detach().cpu().numpy(), y_test.flatten().detach().cpu().numpy()
                    print(pearsonr(pred, true)[0]**2)
                    r2_test.append(pearsonr(pred, true)[0]**2)
    except: print("training failed")
            
    return np.array(r2_test).max()

In [112]:
# Create and run the Optuna study
study = optuna.create_study(direction='maximize')
study.optimize(objective, n_trials=100)

# Print the best hyperparameters
best_trial = study.best_trial
print("Best Trial:")
print(f"  Value: {best_trial.value:.4f}")
print("  Params: ")
for key, value in best_trial.params.items():
    print(f"    {key}: {value}")

# You can then use the best hyperparameters to train your final model.


[I 2024-01-19 13:33:53,368] A new study created in memory with name: no-name-27f1e852-02ba-4eb2-b77e-4df8d58fda24


Epoch 1/200, Loss: 0.35840846077505367
0.5942402176089887
Epoch 11/200, Loss: 0.18352401220654868
0.6527544121861556
Epoch 21/200, Loss: 0.12047758025218205
0.6891556706842097
Epoch 31/200, Loss: 0.09012886253466089
0.7076370447051947
Epoch 41/200, Loss: 0.07855188487524009
0.7137772601093926
Epoch 51/200, Loss: 0.07421772056315319
0.7251129839254373
Epoch 61/200, Loss: 0.0721186118492161
0.7203157801705851
Epoch 71/200, Loss: 0.0702679105641612
0.7233013654616786
Epoch 81/200, Loss: 0.06944993649979672
0.7294060059612447
Epoch 91/200, Loss: 0.06765902904142816
0.7267988873626402
Epoch 101/200, Loss: 0.06728741445814271
0.7307471902189492
Epoch 111/200, Loss: 0.06638545592326715
0.7291067562931973
Epoch 121/200, Loss: 0.06609753752688327
0.7286297080640532
Epoch 131/200, Loss: 0.06501093111842511
0.7321922948393343
Epoch 141/200, Loss: 0.06457290834332087
0.7318985482494854
Epoch 151/200, Loss: 0.06348852157951837
0.7299121722708778
Epoch 161/200, Loss: 0.06346009209393019
0.7319281521

[I 2024-01-19 13:36:04,086] Trial 0 finished with value: 0.7321922948393343 and parameters: {'hidden_dim_h': 33, 'dropout': 0.3427475660668194, 'batch_size': 241}. Best is trial 0 with value: 0.7321922948393343.


Epoch 1/200, Loss: 0.38417450142534154
0.5942531048895968
Epoch 11/200, Loss: 0.24509173827736
0.6451028844387213
Epoch 21/200, Loss: 0.1981477125694877
0.6672663238364476
Epoch 31/200, Loss: 0.1603221218836935
0.6694299530597294
Epoch 41/200, Loss: 0.15687569622930728
0.5040756523246683
Epoch 51/200, Loss: 0.16389045707489314
0.4683405239756521
Epoch 61/200, Loss: 0.17069830196468452
0.44899801207806966
Epoch 71/200, Loss: 0.16696936558735997
0.4641371448362895
Epoch 81/200, Loss: 0.16641578980182348
0.43904927213002776
Epoch 91/200, Loss: 0.16680987924337387
0.46024893896130625
Epoch 101/200, Loss: 0.15927551020132868
0.4685310331276776
Epoch 111/200, Loss: 0.16141838894078606
0.46068507981187484
Epoch 121/200, Loss: 0.1661182598848092
0.4328647434887283
Epoch 131/200, Loss: 0.1686046111740564
0.4367389871561569
Epoch 141/200, Loss: 0.17056883871555328
0.45002575122286453
Epoch 151/200, Loss: 0.16878698138814224
0.44518362750471735
Epoch 161/200, Loss: 0.16172630888851067
0.461013372

[I 2024-01-19 13:38:01,715] Trial 1 finished with value: 0.6694299530597294 and parameters: {'hidden_dim_h': 48, 'dropout': 0.295470157097074, 'batch_size': 529}. Best is trial 0 with value: 0.7321922948393343.


Epoch 1/200, Loss: 0.45792450775971283
0.597483800794112
Epoch 11/200, Loss: 0.19792803538006706
0.5009941140433507
Epoch 21/200, Loss: 0.17995964494105932
0.474777504294267
Epoch 31/200, Loss: 0.17922401146308795
0.38910702961008276
Epoch 41/200, Loss: 0.16415510447444143
0.43916190722160126
Epoch 51/200, Loss: 0.1684722107004475
0.4167365280788453
Epoch 61/200, Loss: 0.16625650166659742
0.41530944396544983
Epoch 71/200, Loss: 0.1630282400024904
0.43522742369374856
Epoch 81/200, Loss: 0.1646575386057029
0.4168357194958799
Epoch 91/200, Loss: 0.16112701896880124
0.44028160742470707
Epoch 101/200, Loss: 0.1711258572098371
0.40239432564958627
Epoch 111/200, Loss: 0.16674280327719612
0.4283791020332167
Epoch 121/200, Loss: 0.16292578002085556
0.4565999336030659
Epoch 131/200, Loss: 0.16981481478826418
0.422465920116025
Epoch 141/200, Loss: 0.16273900483911102
0.4465238563199848
Epoch 151/200, Loss: 0.16097535495017026
0.47028829068662564
Epoch 161/200, Loss: 0.16470448431131002
0.44830975

[I 2024-01-19 13:41:00,797] Trial 2 finished with value: 0.597483800794112 and parameters: {'hidden_dim_h': 44, 'dropout': 0.18581866074082476, 'batch_size': 272}. Best is trial 0 with value: 0.7321922948393343.


Epoch 1/200, Loss: 3.1970216881145133
0.5640149354461644
Epoch 11/200, Loss: 1.2907341827045788
0.5587912460687627
Epoch 21/200, Loss: 0.41269444660706955
0.6056014470196074
Epoch 31/200, Loss: 0.18274893706495113
0.6506134350211991
Epoch 41/200, Loss: 0.14197146797722035
0.6813671711202547
Epoch 51/200, Loss: 0.13059356063604355
0.7021261388683888
Epoch 61/200, Loss: 0.12079792998053811
0.7108409070479184
Epoch 71/200, Loss: 0.10928296202963049
0.7163592900602546
Epoch 81/200, Loss: 0.0993131316520951
0.7209859636985945
Epoch 91/200, Loss: 0.08945814967155456
0.7266550812870683
Epoch 101/200, Loss: 0.08060553209348158
0.7301338689441808
Epoch 111/200, Loss: 0.07382025732235475
0.7344463421742276
Epoch 121/200, Loss: 0.07079616459933194
0.7341908782892483
Epoch 131/200, Loss: 0.06735649745572697
0.7397503726099404
Epoch 141/200, Loss: 0.0655407270247286
0.7383307717108623
Epoch 151/200, Loss: 0.06378049166365103
0.7455893538725052
Epoch 161/200, Loss: 0.06373196264559572
0.741599357370

[I 2024-01-19 13:42:51,588] Trial 3 finished with value: 0.7488079993791794 and parameters: {'hidden_dim_h': 20, 'dropout': 0.25079556315541934, 'batch_size': 364}. Best is trial 3 with value: 0.7488079993791794.


Epoch 1/200, Loss: 2.828356905681331
0.5486130426962932
Epoch 11/200, Loss: 1.3396862483606107
0.584544311000373
Epoch 21/200, Loss: 0.6399482139726964
0.6468770265400119
Epoch 31/200, Loss: 0.36711998829027503
0.6797465818117914
Epoch 41/200, Loss: 0.28178113190139215
0.7017241987588633
Epoch 51/200, Loss: 0.25174227611320776
0.7094184044169679
Epoch 61/200, Loss: 0.22957068136552486
0.7175941642858942
Epoch 71/200, Loss: 0.20627473440112137
0.7184932282275207
Epoch 81/200, Loss: 0.18123583604649798
0.7212791870766497
Epoch 91/200, Loss: 0.1556839379595547
0.7300373971889168
Epoch 101/200, Loss: 0.13018629481879676
0.7391213928172021
Epoch 111/200, Loss: 0.10655186597893877
0.7364301805547598
Epoch 121/200, Loss: 0.08527196580316962
0.7409995489341047
Epoch 131/200, Loss: 0.0684361821267663
0.749332915600817
Epoch 141/200, Loss: 0.05519499947748533
0.739739388161864
Epoch 151/200, Loss: 0.046037430534275565
0.7437767727771708
Epoch 161/200, Loss: 0.03891281165727755
0.7453032114244686

[I 2024-01-19 13:44:50,901] Trial 4 finished with value: 0.749332915600817 and parameters: {'hidden_dim_h': 28, 'dropout': 0.06664068830458326, 'batch_size': 494}. Best is trial 4 with value: 0.749332915600817.


Epoch 1/200, Loss: 2.937785029411316
0.5257782188916493
Epoch 11/200, Loss: 1.8572537899017334
0.5494617546699307
Epoch 21/200, Loss: 1.1692418226828942
0.5898066048018956
Epoch 31/200, Loss: 0.747694751391044
0.6282024967218067
Epoch 41/200, Loss: 0.5113901335459489
0.633964010732949
Epoch 51/200, Loss: 0.3212019537503903
0.6382207827452061
Epoch 61/200, Loss: 0.23280513745087844
0.6533375909789411
Epoch 71/200, Loss: 0.19657005828160506
0.6745515063164464
Epoch 81/200, Loss: 0.18041689693927765
0.6813866393874219
Epoch 91/200, Loss: 0.17127820964042956
0.6969191583642188
Epoch 101/200, Loss: 0.16355941387323233
0.7012501623894077
Epoch 111/200, Loss: 0.155339359664
0.7136492111205953
Epoch 121/200, Loss: 0.14671796216414526
0.7176594568814408
Epoch 131/200, Loss: 0.13806774524542
0.7184735077449744
Epoch 141/200, Loss: 0.12919161354119962
0.7303637643301225
Epoch 151/200, Loss: 0.12076409705556355
0.7237311007288785
Epoch 161/200, Loss: 0.11245138198137283
0.7289330326486052
Epoch 17

[I 2024-01-19 13:46:09,948] Trial 5 finished with value: 0.74416052191544 and parameters: {'hidden_dim_h': 18, 'dropout': 0.2549870762674544, 'batch_size': 776}. Best is trial 4 with value: 0.749332915600817.


Epoch 1/200, Loss: 1.116234314662439
0.5751325152502081
Epoch 11/200, Loss: 0.2979825641270037
0.6139775207663314
Epoch 21/200, Loss: 0.17191941925772913
0.6677016688172212
Epoch 31/200, Loss: 0.15020203893935238
0.6886838568857087
Epoch 41/200, Loss: 0.13034278043994196
0.7087889593669185
Epoch 51/200, Loss: 0.11039935383531782
0.7206812852665743
Epoch 61/200, Loss: 0.09290418898065884
0.7238440091710466
Epoch 71/200, Loss: 0.07774381408536876
0.7277422316524533
Epoch 81/200, Loss: 0.06708359069846294
0.7361007054660109
Epoch 91/200, Loss: 0.05911569904398035
0.7392897250557134
Epoch 101/200, Loss: 0.05417048255050624
0.7393831529282977
Epoch 111/200, Loss: 0.050997755800684295
0.7383954906584843
Epoch 121/200, Loss: 0.049570240218330314
0.7363035873900544
Epoch 131/200, Loss: 0.04711718360582987
0.7377314019200862
Epoch 141/200, Loss: 0.04574267911138358
0.7461859967898774
Epoch 151/200, Loss: 0.044660368727313146
0.7432420480446328
Epoch 161/200, Loss: 0.042863813401372346
0.7446200

[I 2024-01-19 13:47:45,098] Trial 6 finished with value: 0.7461859967898774 and parameters: {'hidden_dim_h': 17, 'dropout': 0.07110237445694514, 'batch_size': 374}. Best is trial 4 with value: 0.749332915600817.


Epoch 1/200, Loss: 0.32788185506570533
0.6008092677823172
Epoch 11/200, Loss: 0.15076512446413276
0.6355184605379918
Epoch 21/200, Loss: 0.14995740751018288
0.5042474876262271
Epoch 31/200, Loss: 0.16951925906001544
0.4517393433794158
Epoch 41/200, Loss: 0.15931455534501154
0.4609978274017945
Epoch 51/200, Loss: 0.15832141860098134
0.4499046532209497
Epoch 61/200, Loss: 0.1692645475268364
0.4474459154732106
Epoch 71/200, Loss: 0.16783896467236223
0.44626780839637664
Epoch 81/200, Loss: 0.17052224192951546
0.44279257879322725
Epoch 91/200, Loss: 0.16431725819091328
0.45042420056757704
Epoch 101/200, Loss: 0.17453571060886147
0.426428386543459
Epoch 111/200, Loss: 0.16725749522447586
0.46232629132929437
Epoch 121/200, Loss: 0.168268226209234
0.4511406524589205
Epoch 131/200, Loss: 0.1687942415964408
0.44363622461928176
Epoch 141/200, Loss: 0.16743610432890596
0.4523802762111312
Epoch 151/200, Loss: 0.16453381994220076
0.4511170260627244
Epoch 161/200, Loss: 0.16531299323332113
0.44527051

[I 2024-01-19 13:50:52,269] Trial 7 finished with value: 0.6355184605379918 and parameters: {'hidden_dim_h': 35, 'dropout': 0.29414185759487643, 'batch_size': 164}. Best is trial 4 with value: 0.749332915600817.


Epoch 1/200, Loss: 0.5028997518514332
0.5816258393744258
Epoch 11/200, Loss: 0.2577162965347892
0.6263932007028155
Epoch 21/200, Loss: 0.16570561339980677
0.6633031423656678
Epoch 31/200, Loss: 0.13903933841931193
0.683492106109344
Epoch 41/200, Loss: 0.1277555470403872
0.7045315006644756
Epoch 51/200, Loss: 0.12160271563028034
0.7180227210079041
Epoch 61/200, Loss: 0.11551680141373684
0.7214861809821368
Epoch 71/200, Loss: 0.10862451164345992
0.7209319809352295
Epoch 81/200, Loss: 0.10223317812932164
0.7245261505131927
Epoch 91/200, Loss: 0.09722330029073514
0.729477708499443
Epoch 101/200, Loss: 0.09086323882404126
0.7316120554006286
Epoch 111/200, Loss: 0.08592575278721358
0.7369032023053491
Epoch 121/200, Loss: 0.08223019736377817
0.7344848006334652
Epoch 131/200, Loss: 0.07734654373244236
0.7313934956911656
Epoch 141/200, Loss: 0.0725661437762411
0.7341224187236459
Epoch 151/200, Loss: 0.06897193997314102
0.7427916853523933
Epoch 161/200, Loss: 0.06459150169240802
0.74568404432938

[I 2024-01-19 13:52:48,018] Trial 8 finished with value: 0.7456840443293852 and parameters: {'hidden_dim_h': 38, 'dropout': 0.2713466781876055, 'batch_size': 1105}. Best is trial 4 with value: 0.749332915600817.


Epoch 1/200, Loss: 2.0567384693357678
0.5492600390773713
Epoch 11/200, Loss: 1.3948338164223566
0.5482073145962026
Epoch 21/200, Loss: 0.9545247422324287
0.5930979879004596
Epoch 31/200, Loss: 0.6569256948100196
0.6406392105984079
Epoch 41/200, Loss: 0.46596896317270065
0.6670016085706548
Epoch 51/200, Loss: 0.3510819441742367
0.6672335720211693
Epoch 61/200, Loss: 0.2872005005677541
0.6960094358308113
Epoch 71/200, Loss: 0.2527240787943204
0.7022347874630348
Epoch 81/200, Loss: 0.23361251006523767
0.7073217706017345
Epoch 91/200, Loss: 0.2217054060763783
0.7153029009465377
Epoch 101/200, Loss: 0.21212347431315315
0.7127319450408991
Epoch 111/200, Loss: 0.20328555835617912
0.7224467772042362
Epoch 121/200, Loss: 0.19455233050717247
0.7283852867594856
Epoch 131/200, Loss: 0.18518667916456857
0.7252712741987828
Epoch 141/200, Loss: 0.17568165477779177
0.7283522636297284
Epoch 151/200, Loss: 0.1660392830769221
0.7270198262441635
Epoch 161/200, Loss: 0.15619253946675193
0.738434410684802
E

[I 2024-01-19 13:54:12,566] Trial 9 finished with value: 0.7424157769866739 and parameters: {'hidden_dim_h': 22, 'dropout': 0.17103790564950988, 'batch_size': 1127}. Best is trial 4 with value: 0.749332915600817.


Epoch 1/200, Loss: 0.5392275430538036
0.5729961789752311
Epoch 11/200, Loss: 0.20709907898196467
0.6469701464980144
Epoch 21/200, Loss: 0.1274851229455736
0.6879508837908045
Epoch 31/200, Loss: 0.11005940095142082
0.7162780928225582
Epoch 41/200, Loss: 0.0989325695015766
0.7204647096965249
Epoch 51/200, Loss: 0.09092856557280929
0.7289556406007192
Epoch 61/200, Loss: 0.08148983507244675
0.7273866274198602
Epoch 71/200, Loss: 0.07229863079609694
0.7264373909532764
Epoch 81/200, Loss: 0.06549122184515
0.7320107876721902
Epoch 91/200, Loss: 0.058091091337027376
0.728653874189373
Epoch 101/200, Loss: 0.05181480171503844
0.7263363168880399
Epoch 111/200, Loss: 0.04746149576924465
0.7327491627189964
Epoch 121/200, Loss: 0.041899925028836285
0.7363932016538467
Epoch 131/200, Loss: 0.03881059683583401
0.7339329785579378
Epoch 141/200, Loss: 0.03646012299038746
0.7351450142159432
Epoch 151/200, Loss: 0.03431829451410859
0.7352240687650015
Epoch 161/200, Loss: 0.03324682927793927
0.7405294345279

[I 2024-01-19 13:55:48,004] Trial 10 finished with value: 0.7405294345279639 and parameters: {'hidden_dim_h': 27, 'dropout': 0.06260208143425046, 'batch_size': 765}. Best is trial 4 with value: 0.749332915600817.


Epoch 1/200, Loss: 0.5805460065603256
0.5377149281653916
Epoch 11/200, Loss: 0.2495770621157828
0.6165464174322776
Epoch 21/200, Loss: 0.21001173023666656
0.6415120360271153
Epoch 31/200, Loss: 0.17949893751314708
0.6667190840771362
Epoch 41/200, Loss: 0.14935055765367689
0.6870279522342632
Epoch 51/200, Loss: 0.12351380395037788
0.6938621165911707
Epoch 61/200, Loss: 0.10324000389803023
0.7112609570542209
Epoch 71/200, Loss: 0.08835730453332265
0.702766013541109
Epoch 81/200, Loss: 0.07772122891176314
0.722338008893779
Epoch 91/200, Loss: 0.07109964328507583
0.731545549395032
Epoch 101/200, Loss: 0.06717561557888985
0.7354649896475227
Epoch 111/200, Loss: 0.06492217505971591
0.7404164159693911
Epoch 121/200, Loss: 0.06352209042580355
0.7398238597911676
Epoch 131/200, Loss: 0.06151555780143965
0.7418240303454781
Epoch 141/200, Loss: 0.0610111699040447
0.7458952465980356
Epoch 151/200, Loss: 0.06073606865746634
0.7396848545859974
Epoch 161/200, Loss: 0.059734346699856576
0.7425228485467

[I 2024-01-19 13:57:11,107] Trial 11 finished with value: 0.7458952465980356 and parameters: {'hidden_dim_h': 10, 'dropout': 0.12889403926954968, 'batch_size': 482}. Best is trial 4 with value: 0.749332915600817.


Epoch 1/200, Loss: 0.19933388262025772
0.5812875856707431
Epoch 11/200, Loss: 0.14859748030862502
0.6564500036067646
Epoch 21/200, Loss: 0.12054379092108819
0.6965362399866238
Epoch 31/200, Loss: 0.09770158365849525
0.7191796101963676
Epoch 41/200, Loss: 0.08240917685531801
0.7392296996825987
Epoch 51/200, Loss: 0.06976958568538388
0.7455087744749315
Epoch 61/200, Loss: 0.06282012693343623
0.7494876964061838
Epoch 71/200, Loss: 0.05640531102976491
0.7463540936336083
Epoch 81/200, Loss: 0.05345879963809444
0.7505852323183163
Epoch 91/200, Loss: 0.04967664290339716
0.7497648128377301
Epoch 101/200, Loss: 0.04787215422238073
0.7590118470647331
Epoch 111/200, Loss: 0.045998437991065365
0.7544016775113378
Epoch 121/200, Loss: 0.04453376752714957
0.7555352264094883
Epoch 131/200, Loss: 0.0425771165999674
0.7628955979656156
Epoch 141/200, Loss: 0.041782708538155404
0.7511088611658139
Epoch 151/200, Loss: 0.041195749034804684
0.7603865401423645
Epoch 161/200, Loss: 0.04050676176144231
0.757864

[I 2024-01-19 13:58:50,623] Trial 12 finished with value: 0.7631697671609307 and parameters: {'hidden_dim_h': 27, 'dropout': 0.13162897451116728, 'batch_size': 646}. Best is trial 12 with value: 0.7631697671609307.


Epoch 1/200, Loss: 2.078453560670217
0.5493481024277065
Epoch 11/200, Loss: 1.1686346292495728
0.34901434764290734
Epoch 21/200, Loss: 0.5631678322950999
0.6180260496563333
Epoch 31/200, Loss: 0.28889922400315604
0.6668059567088432
Epoch 41/200, Loss: 0.18288954198360444
0.7028571999533413
Epoch 51/200, Loss: 0.14615726768970488
0.7124719876295696
Epoch 61/200, Loss: 0.1332363006969293
0.7196236741412677
Epoch 71/200, Loss: 0.12446391408642134
0.7280869613925314
Epoch 81/200, Loss: 0.11645706767837206
0.7372209887956527
Epoch 91/200, Loss: 0.10890826558073362
0.745444864591192
Epoch 101/200, Loss: 0.10055184712012609
0.7494033075909493
Epoch 111/200, Loss: 0.09244343464573225
0.7492140191139129
Epoch 121/200, Loss: 0.08355546121795972
0.7525072271913736
Epoch 131/200, Loss: 0.07604481900731723
0.7527438304785353
Epoch 141/200, Loss: 0.06869882109264533
0.7491649731772514
Epoch 151/200, Loss: 0.06210214669505755
0.7546547050399941
Epoch 161/200, Loss: 0.056251246854662894
0.755616658702

[I 2024-01-19 14:00:34,251] Trial 13 finished with value: 0.7628167993877022 and parameters: {'hidden_dim_h': 27, 'dropout': 0.11592526293219417, 'batch_size': 680}. Best is trial 12 with value: 0.7631697671609307.


Epoch 1/200, Loss: 0.3813164220614867
0.5727698218371285
Epoch 11/200, Loss: 0.25614193691448733
0.6446936237685675
Epoch 21/200, Loss: 0.22436424209312958
0.6812075627993797
Epoch 31/200, Loss: 0.19621278006922116
0.7033659301551166
Epoch 41/200, Loss: 0.16901225461201233
0.7162884993713466
Epoch 51/200, Loss: 0.14432663131843915
0.7293665873663047
Epoch 61/200, Loss: 0.12272112545641986
0.74368160088293


[I 2024-01-19 14:01:04,140] Trial 14 finished with value: 0.74368160088293 and parameters: {'hidden_dim_h': 27, 'dropout': 0.12554222480884783, 'batch_size': 916}. Best is trial 12 with value: 0.7631697671609307.


training failed
Epoch 1/200, Loss: 2.140313033014536
0.557151803526926
Epoch 11/200, Loss: 1.1156439147889614
0.6212814833980538
Epoch 21/200, Loss: 0.5970610622316599
0.656059772339312
Epoch 31/200, Loss: 0.3689616248011589
0.6928546945143783
Epoch 41/200, Loss: 0.28518639598041773
0.7130288480975008
Epoch 51/200, Loss: 0.2538530621677637
0.7244513321146328


[I 2024-01-19 14:01:37,709] Trial 15 finished with value: 0.7244513321146328 and parameters: {'hidden_dim_h': 40, 'dropout': 0.13527968507889804, 'batch_size': 641}. Best is trial 12 with value: 0.7631697671609307.


training failed
Epoch 1/200, Loss: 0.5067801800641146
0.5635105397148698


[I 2024-01-19 14:01:40,626] Trial 16 finished with value: 0.5635105397148698 and parameters: {'hidden_dim_h': 24, 'dropout': 0.10279175136344948, 'batch_size': 918}. Best is trial 12 with value: 0.7631697671609307.


training failed
training failed


[W 2024-01-19 14:01:40,818] Trial 17 failed with parameters: {'hidden_dim_h': 13, 'dropout': 0.17354865487671933, 'batch_size': 706} because of the following error: ValueError('zero-size array to reduction operation maximum which has no identity').
Traceback (most recent call last):
  File "/home/juannanzhou/.local/lib/python3.10/site-packages/optuna/study/_optimize.py", line 200, in _run_trial
    value_or_values = func(trial)
  File "/scratch/local/21743416/ipykernel_2182428/1032276540.py", line 55, in objective
    return np.array(r2_test).max()
  File "/apps/pytorch/2.0.1/lib/python3.10/site-packages/numpy/core/_methods.py", line 41, in _amax
    return umr_maximum(a, axis, None, out, keepdims, initial, where)
ValueError: zero-size array to reduction operation maximum which has no identity
[W 2024-01-19 14:01:40,851] Trial 17 failed with value None.


ValueError: zero-size array to reduction operation maximum which has no identity

#### 2 layers no softmax

In [122]:
import optuna
from scipy.stats import pearsonr
learning_rate = 0.001
epochs = 200
num_heads = 4
num_layers = 2
sequence_length = L
input_dim = AA_size*L
output_dim = 1
dropout_init = 0.3
batch_size_init = 1000
hidden_dim_h_init = 32

def objective(trial):
    # Define the hyperparameters to be optimized
    # hidden_dim_h = trial.suggest_int('hidden_dim_h', hidden_dim_h_init, 10, 50)
    # dropout = trial.suggest_float('dropout', dropout_init, 0.05, 0.35)
    # batch_size = trial.suggest_int('batch_size', batch_size_init, 100, 1200)

    hidden_dim_h = trial.suggest_int('hidden_dim_h', 10, 50)
    dropout = trial.suggest_float('dropout', 0.05, 0.35)
    batch_size = trial.suggest_int('batch_size', 100, 1200)
    
    model = Transformer_torch_MHA(input_dim, hidden_dim_h*num_heads, num_layers, num_heads, dropout).to(device)
    
    train_loader = data.DataLoader(train_dataset,
                                   batch_size=batch_size,
                                   shuffle=True,
                                   drop_last=False)
    criterion = nn.MSELoss()
    optimizer = optim.Adam(model.parameters(), lr=learning_rate)

    r2_test = []
    try: 
        for epoch in range(epochs):

                model.train()
                total_loss = 0
                for batch_inputs, batch_targets in train_loader:
                    optimizer.zero_grad()
                    outputs = model(batch_inputs)
                    loss = criterion(outputs, batch_targets)
                    loss.backward()
                    optimizer.step()
                    total_loss += loss.item()

                if epoch % 10 == 0:
                    print(f"Epoch {epoch+1}/{epochs}, Loss: {total_loss/len(train_loader)}")
                    model.eval()
                    pred, true = model(X_test.flatten(1)).flatten().detach().cpu().numpy(), y_test.flatten().detach().cpu().numpy()
                    print(pearsonr(pred, true)[0]**2)
                    r2_test.append(pearsonr(pred, true)[0]**2)
    except: print("training failed")
            
    return np.array(r2_test).max()

In [123]:
# Create and run the Optuna study
study = optuna.create_study(direction='maximize')
study.optimize(objective, n_trials=100)

# Print the best hyperparameters
best_trial = study.best_trial
print("Best Trial:")
print(f"  Value: {best_trial.value:.4f}")
print("  Params: ")
for key, value in best_trial.params.items():
    print(f"    {key}: {value}")

# You can then use the best hyperparameters to train your final model.


[I 2024-01-19 14:08:43,373] A new study created in memory with name: no-name-f49c2b07-7fc1-43f0-be22-9e7ef458829e


Epoch 1/200, Loss: 3.302435874938965
0.5308911542826704
Epoch 11/200, Loss: 2.025254575411479
0.6018419162380462
Epoch 21/200, Loss: 1.2291974584261576
0.6492671089870524
Epoch 31/200, Loss: 0.6863061547279358
0.626043205558727
Epoch 41/200, Loss: 0.3684600522120794
0.6840951003557086
Epoch 51/200, Loss: 0.22365091145038604
0.703078217474124
Epoch 61/200, Loss: 0.16451507111390432
0.7241036554471962
Epoch 71/200, Loss: 0.1415091556807359
0.722826526468209
Epoch 81/200, Loss: 0.130874947955211
0.7212657023835715
Epoch 91/200, Loss: 0.1233563410739104
0.725610932095042
Epoch 101/200, Loss: 0.11563581054409346
0.7255565733831083
Epoch 111/200, Loss: 0.10813507239023844
0.7295461654231327
Epoch 121/200, Loss: 0.10005675728122393
0.7312926679404769
Epoch 131/200, Loss: 0.09238090763489405
0.7331562594056626
Epoch 141/200, Loss: 0.08438843041658402
0.729611895726436
Epoch 151/200, Loss: 0.07723999818166097
0.7381485441506068
Epoch 161/200, Loss: 0.06988784559071064
0.7324469302584263
Epoch 1

[I 2024-01-19 14:10:03,482] Trial 0 finished with value: 0.7381485441506068 and parameters: {'hidden_dim_h': 18, 'dropout': 0.25713024730311235, 'batch_size': 669}. Best is trial 0 with value: 0.7381485441506068.


Epoch 1/200, Loss: 0.24791812738205524
0.6274995808585263
Epoch 11/200, Loss: 0.11440799232070328
0.7045982781257514
Epoch 21/200, Loss: 0.07430940982720531
0.7198764984878808
Epoch 31/200, Loss: 0.0613176907207949
0.7286122430831775
Epoch 41/200, Loss: 0.056457984901911826
0.7300068053681393
Epoch 51/200, Loss: 0.05331549246577506
0.7266036162997447
Epoch 61/200, Loss: 0.04970676420216865
0.7394314448577997
Epoch 71/200, Loss: 0.04787201966746902
0.739412833871484
Epoch 81/200, Loss: 0.046070046035955985
0.7339487993917846
Epoch 91/200, Loss: 0.0448397224016012
0.7320833850957544
Epoch 101/200, Loss: 0.04266923852264881
0.7311151068895683
Epoch 111/200, Loss: 0.04154934871492656
0.7322427993464045
Epoch 121/200, Loss: 0.04011028920505064
0.7346974878672058
Epoch 131/200, Loss: 0.03974673749073177
0.7357730840662974
Epoch 141/200, Loss: 0.03768137216250947
0.7311563859191648
Epoch 151/200, Loss: 0.03764295852776115
0.7306022489892205
Epoch 161/200, Loss: 0.035953093439023545
0.73154734

[I 2024-01-19 14:13:17,405] Trial 1 finished with value: 0.7394314448577997 and parameters: {'hidden_dim_h': 29, 'dropout': 0.2939796738858717, 'batch_size': 142}. Best is trial 1 with value: 0.7394314448577997.


Epoch 1/200, Loss: 0.4930994709332784
0.6215462896046233
Epoch 11/200, Loss: 0.29121141756574315
0.72558411374878
Epoch 21/200, Loss: 0.24229617851475874
0.7277727065222911
Epoch 31/200, Loss: 0.2124030701816082
0.7182545669179807
Epoch 41/200, Loss: 0.18159960707028708
0.72932911404751
Epoch 51/200, Loss: 0.1521769439180692
0.7220343458124047
Epoch 61/200, Loss: 0.12590184962997833
0.7326698550949159
Epoch 71/200, Loss: 0.10241188916067283
0.7223246190925238
Epoch 81/200, Loss: 0.08233033679425716
0.722975680253712
Epoch 91/200, Loss: 0.06658460727582376
0.7293989413550851
Epoch 101/200, Loss: 0.05286577887212237
0.7343829139857782
Epoch 111/200, Loss: 0.043007458870609604
0.7216824456259899
Epoch 121/200, Loss: 0.034567254750678934
0.7292683446128276
Epoch 131/200, Loss: 0.028721813422938187
0.7305908585465306
Epoch 141/200, Loss: 0.02491699104818205
0.7287525852310505
Epoch 151/200, Loss: 0.021888718164215486
0.7221396065158281
Epoch 161/200, Loss: 0.019863406584287684
0.71974219529

[I 2024-01-19 14:14:58,644] Trial 2 finished with value: 0.7343829139857782 and parameters: {'hidden_dim_h': 38, 'dropout': 0.09568280683286604, 'batch_size': 853}. Best is trial 1 with value: 0.7394314448577997.


Epoch 1/200, Loss: 0.3206292192141215
0.6198732063004163
Epoch 11/200, Loss: 0.22671127369006475
0.706887556393749
Epoch 21/200, Loss: 0.1787787616252899
0.71700371123731
Epoch 31/200, Loss: 0.13781916002432507
0.7238934155384349
Epoch 41/200, Loss: 0.1060157634317875
0.7318468927438985
Epoch 51/200, Loss: 0.08178697029749553
0.7315001717991627
Epoch 61/200, Loss: 0.06508440524339676
0.7308616517625314
Epoch 71/200, Loss: 0.05319201201200485
0.7413485252244962
Epoch 81/200, Loss: 0.04633296777804693
0.7238704275734009
Epoch 91/200, Loss: 0.04078692644834518
0.7282296137477061
Epoch 101/200, Loss: 0.037907998884717624
0.7268224072094445
Epoch 111/200, Loss: 0.035555809177458285
0.7257433956316581
Epoch 121/200, Loss: 0.034036731844147045
0.734859029467267
Epoch 131/200, Loss: 0.03267027083784342
0.725607526347893
Epoch 141/200, Loss: 0.031964327519138656
0.72776131638822
Epoch 151/200, Loss: 0.03131657553215821
0.7254192419315265
Epoch 161/200, Loss: 0.03028765128304561
0.73174873283814

[I 2024-01-19 14:16:50,599] Trial 3 finished with value: 0.7413485252244962 and parameters: {'hidden_dim_h': 46, 'dropout': 0.3186724630088547, 'batch_size': 681}. Best is trial 3 with value: 0.7413485252244962.


Epoch 1/200, Loss: 0.5714413821697235
0.5701581180880625
Epoch 11/200, Loss: 0.32798973553710514
0.6623599993902293
Epoch 21/200, Loss: 0.23692849940723842
0.685684524555334
Epoch 31/200, Loss: 0.20386662748124865
0.7006204785019543
Epoch 41/200, Loss: 0.18960525426599714
0.71250321483149
Epoch 51/200, Loss: 0.17476330366399553
0.710392317714121
Epoch 61/200, Loss: 0.16034003181589973
0.717549794004976
Epoch 71/200, Loss: 0.14663392305374146
0.7178988412308092
Epoch 81/200, Loss: 0.13251289394166735
0.727545602662253
Epoch 91/200, Loss: 0.11998234937588374
0.717885203877996
Epoch 101/200, Loss: 0.10744530335068703
0.7266600807965251
Epoch 111/200, Loss: 0.09569302284055287
0.7265437037842492
Epoch 121/200, Loss: 0.08645448999272452
0.7305047841061766
Epoch 131/200, Loss: 0.07642814682589637
0.7264956309711197
Epoch 141/200, Loss: 0.06844421269165145
0.7303544082233557
Epoch 151/200, Loss: 0.062486418005492955
0.7335636220749102
Epoch 161/200, Loss: 0.05597487878468302
0.724597253898739

[I 2024-01-19 14:18:08,534] Trial 4 finished with value: 0.7335636220749102 and parameters: {'hidden_dim_h': 14, 'dropout': 0.11837994799432536, 'batch_size': 1162}. Best is trial 3 with value: 0.7413485252244962.


Epoch 1/200, Loss: 0.6753604098370201
0.5789567850529608
Epoch 11/200, Loss: 0.3260961833753084
0.6448197748815019
Epoch 21/200, Loss: 0.1723339651760302
0.6850053539083069
Epoch 31/200, Loss: 0.10998849335469697
0.7030546822579561
Epoch 41/200, Loss: 0.08972274159130297
0.7225561071003422
Epoch 51/200, Loss: 0.08188448258136448
0.7197502749691013
Epoch 61/200, Loss: 0.07836849516943882
0.7214143284726867
Epoch 71/200, Loss: 0.07510137754051309
0.7269517609099008
Epoch 81/200, Loss: 0.07243980624173817
0.7213353601942913
Epoch 91/200, Loss: 0.06929669215490944
0.7228000539956845
Epoch 101/200, Loss: 0.06674939197929282
0.7229638718372603
Epoch 111/200, Loss: 0.06401550436490461
0.7208216109382333
Epoch 121/200, Loss: 0.061626959199968134
0.7231254062065968
Epoch 131/200, Loss: 0.05950837660776941
0.7243057677364481
Epoch 141/200, Loss: 0.05756943849356551
0.7226783505819931
Epoch 151/200, Loss: 0.055237108939572385
0.7278392208036372
Epoch 161/200, Loss: 0.054198345855662695
0.72255958

[I 2024-01-19 14:19:05,060] Trial 5 finished with value: 0.7278392208036372 and parameters: {'hidden_dim_h': 12, 'dropout': 0.17625589215082677, 'batch_size': 1092}. Best is trial 3 with value: 0.7413485252244962.


Epoch 1/200, Loss: 0.9881240763971882
0.5829532466835686
Epoch 11/200, Loss: 0.3959209121042682
0.6542318491107235
Epoch 21/200, Loss: 0.19026524405325612
0.6972460861503063
Epoch 31/200, Loss: 0.13497132567628736
0.7124680454921895
Epoch 41/200, Loss: 0.1219415775229854
0.7191681565097309
Epoch 51/200, Loss: 0.11483543870910522
0.7230909838353241
Epoch 61/200, Loss: 0.10574332985185808
0.7220392654566279
Epoch 71/200, Loss: 0.09841079144708571
0.7337749014569527
Epoch 81/200, Loss: 0.08947719152896635
0.7331731614297696
Epoch 91/200, Loss: 0.0831624279099126
0.7319051552806582
Epoch 101/200, Loss: 0.07604105362007695
0.7349874186925553
Epoch 111/200, Loss: 0.06951910978363406
0.7367080741155325
Epoch 121/200, Loss: 0.06419700972976224
0.7373976663212519
Epoch 131/200, Loss: 0.059476097504938805
0.7340450521907561
Epoch 141/200, Loss: 0.055118574129958305
0.7417409323487476
Epoch 151/200, Loss: 0.052782077342271805
0.7350120834340264
Epoch 161/200, Loss: 0.05075709617907001
0.736409447

[I 2024-01-19 14:19:58,163] Trial 6 finished with value: 0.7417409323487476 and parameters: {'hidden_dim_h': 16, 'dropout': 0.3130445730867097, 'batch_size': 664}. Best is trial 6 with value: 0.7417409323487476.


Epoch 1/200, Loss: 0.18282867426222021
0.5754290238222298
Epoch 11/200, Loss: 0.13076757165518674
0.6711105464449293
Epoch 21/200, Loss: 0.10722932727499442
0.6974215567210353
Epoch 31/200, Loss: 0.09072175080125983
0.7038704416662404
Epoch 41/200, Loss: 0.08009439503604715
0.7125226568673058
Epoch 51/200, Loss: 0.071675797755068
0.7171114998968107
Epoch 61/200, Loss: 0.06675242547961799
0.7170794055875905
Epoch 71/200, Loss: 0.06315856731750748
0.7167995416466671
Epoch 81/200, Loss: 0.0607633919201114
0.7178874537327465
Epoch 91/200, Loss: 0.05803247337991541
0.7227447284274051
Epoch 101/200, Loss: 0.057640867815776306
0.7196071384280391
Epoch 111/200, Loss: 0.055372321300885895
0.7174881705158933
Epoch 121/200, Loss: 0.054620030082084915
0.7152420948653653
Epoch 131/200, Loss: 0.054053793915293434
0.7206311254026603
Epoch 141/200, Loss: 0.052809547294269905
0.7180933304611129
Epoch 151/200, Loss: 0.052417578852989456
0.7222594505502449
Epoch 161/200, Loss: 0.051910009743137794
0.7196

[I 2024-01-19 14:20:46,980] Trial 7 finished with value: 0.7249859842826948 and parameters: {'hidden_dim_h': 11, 'dropout': 0.19741471866287458, 'batch_size': 918}. Best is trial 6 with value: 0.7417409323487476.


Epoch 1/200, Loss: 0.7239214239581939
0.5965123065778676
Epoch 11/200, Loss: 0.3105321084299395
0.6943940999517767
Epoch 21/200, Loss: 0.21296096569107426
0.7181154745093313
Epoch 31/200, Loss: 0.18687814281832787
0.7192147573773118
Epoch 41/200, Loss: 0.16715858492159075
0.7205318255517019
Epoch 51/200, Loss: 0.14645117857763845
0.7238987477111952
Epoch 61/200, Loss: 0.12620324737602664
0.7254126029669654
Epoch 71/200, Loss: 0.1076860870084455
0.7294818325088885
Epoch 81/200, Loss: 0.09055986567851036
0.7307186214348806
Epoch 91/200, Loss: 0.07685517207268745
0.7372167194690797
Epoch 101/200, Loss: 0.06584232456741794
0.7328116460544929
Epoch 111/200, Loss: 0.05680372902462559
0.7334345817313593
Epoch 121/200, Loss: 0.0500854181666528
0.7261068635555632
Epoch 131/200, Loss: 0.04541085083638468
0.7289965645516796
Epoch 141/200, Loss: 0.04257623598940911
0.7278895146610838
Epoch 151/200, Loss: 0.040415349266221444
0.7313246361048236
Epoch 161/200, Loss: 0.03868998226619536
0.72657289027

[I 2024-01-19 14:21:42,536] Trial 8 finished with value: 0.7372167194690797 and parameters: {'hidden_dim_h': 20, 'dropout': 0.2408789743191922, 'batch_size': 654}. Best is trial 6 with value: 0.7417409323487476.


Epoch 1/200, Loss: 0.21662377483314937
0.6207368694760359
Epoch 11/200, Loss: 0.13850385198990503
0.7127189204266968
Epoch 21/200, Loss: 0.11983777706821759
0.724916722621459
Epoch 31/200, Loss: 0.102750975638628
0.7329111901918088
Epoch 41/200, Loss: 0.08744868801699744
0.7290428192239938
Epoch 51/200, Loss: 0.07494383884800805
0.7266884764004434
Epoch 61/200, Loss: 0.06417251171337233
0.7237609721661272
Epoch 71/200, Loss: 0.05567478243675497
0.7298278745615662
Epoch 81/200, Loss: 0.04923122624556223
0.7280714753497269
Epoch 91/200, Loss: 0.04443941927618451
0.7272720721668113
Epoch 101/200, Loss: 0.040549071298705205
0.7224083857045341
Epoch 111/200, Loss: 0.0378371292932166
0.7205350538183416
Epoch 121/200, Loss: 0.035905069982012115
0.7202710345425194
Epoch 131/200, Loss: 0.033710268429583974
0.7232565254408004
Epoch 141/200, Loss: 0.03236611353026496
0.723623753563998
Epoch 151/200, Loss: 0.031340476435919605
0.7244719408255084
Epoch 161/200, Loss: 0.030698993967639074
0.72185411

[I 2024-01-19 14:22:47,386] Trial 9 finished with value: 0.7329111901918088 and parameters: {'hidden_dim_h': 38, 'dropout': 0.2918899435318971, 'batch_size': 1123}. Best is trial 6 with value: 0.7417409323487476.


Epoch 1/200, Loss: 0.20301057360594785
0.6217604624654529
Epoch 11/200, Loss: 0.10537262581571748
0.7030934586117531
Epoch 21/200, Loss: 0.08124458855843242
0.7194460755650753
Epoch 31/200, Loss: 0.0682350186796128
0.724903477777258
Epoch 41/200, Loss: 0.06268058783268626
0.7257164105847698
Epoch 51/200, Loss: 0.058391429672512825
0.7216065704972086
Epoch 61/200, Loss: 0.05457319687061672
0.7259380897932008
Epoch 71/200, Loss: 0.05331346798169462
0.7340508957801224
Epoch 81/200, Loss: 0.050467954642033276
0.7292132435707579
Epoch 91/200, Loss: 0.04904599138830282
0.7348022901945737
Epoch 101/200, Loss: 0.0473351703980301
0.7302548747981816
Epoch 111/200, Loss: 0.04542273971476132
0.7354475393023784
Epoch 121/200, Loss: 0.044808541389205786
0.7332876855024094
Epoch 131/200, Loss: 0.04316773586258103
0.7364906932448962
Epoch 141/200, Loss: 0.0427874749691426
0.7368078152552884
Epoch 151/200, Loss: 0.042251333452855484
0.7358670546974537
Epoch 161/200, Loss: 0.04113366405326355
0.73275536

[I 2024-01-19 14:24:05,721] Trial 10 finished with value: 0.7368078152552884 and parameters: {'hidden_dim_h': 25, 'dropout': 0.3463302106667126, 'batch_size': 255}. Best is trial 6 with value: 0.7417409323487476.


Epoch 1/200, Loss: 0.9190086608237409
0.5824255764675154
Epoch 11/200, Loss: 0.3600485971633424
0.6296738300093909
Epoch 21/200, Loss: 0.2074027400701604
0.6515377598018871
Epoch 31/200, Loss: 0.18018494673231814
0.685015854946426
Epoch 41/200, Loss: 0.15555718128985546
0.7068412631245561
Epoch 51/200, Loss: 0.13133313538546257
0.7190826501477556
Epoch 61/200, Loss: 0.1089110716860345
0.7334943461206512
Epoch 71/200, Loss: 0.09056270994404529
0.732547431044154
Epoch 81/200, Loss: 0.07530305288890575
0.729014522970509
Epoch 91/200, Loss: 0.06491460690790034
0.7331884882933206
Epoch 101/200, Loss: 0.05759265345144779
0.7382384341787528
Epoch 111/200, Loss: 0.052415165733149714
0.7362546413984236
Epoch 121/200, Loss: 0.049656328527217214
0.7317976810586376
Epoch 131/200, Loss: 0.04693615729821489
0.7385986260349868
Epoch 141/200, Loss: 0.045189698167303775
0.7394792084185706
Epoch 151/200, Loss: 0.044597845841595464
0.7427472413365445
Epoch 161/200, Loss: 0.04279653410962288
0.73844451643

[I 2024-01-19 14:25:27,955] Trial 11 finished with value: 0.7427472413365445 and parameters: {'hidden_dim_h': 49, 'dropout': 0.3488598777160132, 'batch_size': 429}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 0.2530737444758415
0.6297547687349077
Epoch 11/200, Loss: 0.16336081306571545
0.7040941809510899
Epoch 21/200, Loss: 0.12648975201275037
0.720992087640687
Epoch 31/200, Loss: 0.09523170570964398
0.7255985064875695
Epoch 41/200, Loss: 0.07372148796592069
0.7270512718568847
Epoch 51/200, Loss: 0.059267915218420654
0.7346493871833649
Epoch 61/200, Loss: 0.0502274201615997
0.7213201846721696
Epoch 71/200, Loss: 0.04551157962692821
0.7283136261965069
Epoch 81/200, Loss: 0.041625047345524246
0.7304857290618704
Epoch 91/200, Loss: 0.03933548570975014
0.7250276014450184
Epoch 101/200, Loss: 0.03803222982779793
0.7273487130099066
Epoch 111/200, Loss: 0.03664495050907135
0.7269743982890553
Epoch 121/200, Loss: 0.036283719515346965
0.7308875889717711
Epoch 131/200, Loss: 0.034872473581977516
0.7254224441481576
Epoch 141/200, Loss: 0.03420455628277167
0.724434040883552
Epoch 151/200, Loss: 0.03352405551982963
0.7290033122807015
Epoch 161/200, Loss: 0.03257184674072525
0.72130811

[I 2024-01-19 14:26:44,724] Trial 12 finished with value: 0.7346493871833649 and parameters: {'hidden_dim_h': 43, 'dropout': 0.3414737904564971, 'batch_size': 441}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 1.6353289630677965
0.5504596313522614
Epoch 11/200, Loss: 0.5331132140424516
0.6812025845708223
Epoch 21/200, Loss: 0.18037163317203522
0.7220578075934297
Epoch 31/200, Loss: 0.10618367625607385
0.7323242154543458
Epoch 41/200, Loss: 0.09099276694986555
0.732424301891487
Epoch 51/200, Loss: 0.08190439724259907
0.7328473334476177
Epoch 61/200, Loss: 0.07340598288509581
0.7340311574833565
Epoch 71/200, Loss: 0.06491696644160483
0.7414941349074715
Epoch 81/200, Loss: 0.05647903225488133
0.7355881486579909
Epoch 91/200, Loss: 0.04950286986099349
0.7293234162287686
Epoch 101/200, Loss: 0.04290440123942163
0.7359101040740911
Epoch 111/200, Loss: 0.03838294628593657
0.7292739249684403
Epoch 121/200, Loss: 0.034205109833015335
0.7277663482628574
Epoch 131/200, Loss: 0.03163267556164
0.7353717532798669
Epoch 141/200, Loss: 0.030153160997562937
0.72542357179112
Epoch 151/200, Loss: 0.029245378408167096
0.7293790419596051
Epoch 161/200, Loss: 0.028851420018408035
0.730668983411

[I 2024-01-19 14:27:55,221] Trial 13 finished with value: 0.7414941349074715 and parameters: {'hidden_dim_h': 37, 'dropout': 0.2497489844171477, 'batch_size': 447}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 0.7365846607996069
0.5970994683543526
Epoch 11/200, Loss: 0.16246062808710596
0.7113355319181683
Epoch 21/200, Loss: 0.08557492041069528
0.7238999675464352
Epoch 31/200, Loss: 0.07390604346342709
0.7320241942850306
Epoch 41/200, Loss: 0.06540960389310899
0.7339559230351074
Epoch 51/200, Loss: 0.057939829466783485
0.7321418971121749
Epoch 61/200, Loss: 0.05134825189800366
0.7340632611424076
Epoch 71/200, Loss: 0.045389054586058075
0.7281072970371127
Epoch 81/200, Loss: 0.04136126269788846
0.7265867980429637
Epoch 91/200, Loss: 0.03785707833974258
0.731433954771371
Epoch 101/200, Loss: 0.034988612786907215
0.7333183251474573
Epoch 111/200, Loss: 0.03282395086210707
0.7303763118470792
Epoch 121/200, Loss: 0.03239884640535583
0.7248491901478276
Epoch 131/200, Loss: 0.030816125481025032
0.7196246476261875
Epoch 141/200, Loss: 0.02967696819130493
0.7256002071826931
Epoch 151/200, Loss: 0.02987097936641911
0.7224530329449618
Epoch 161/200, Loss: 0.028698474938130897
0.72624

[I 2024-01-19 14:29:17,293] Trial 14 finished with value: 0.7340632611424076 and parameters: {'hidden_dim_h': 50, 'dropout': 0.2920120823440834, 'batch_size': 442}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 0.3846324714832008
0.622907602903677
Epoch 11/200, Loss: 0.1737266245763749
0.7052969399507799
Epoch 21/200, Loss: 0.11962106660939753
0.7307167476653307
Epoch 31/200, Loss: 0.07841731840744615
0.7326974457696372
Epoch 41/200, Loss: 0.053872177843004465
0.7349123200098928
Epoch 51/200, Loss: 0.04134240286657587
0.7340680548996004
Epoch 61/200, Loss: 0.034826280520064756
0.7355854042614565
Epoch 71/200, Loss: 0.03301383153302595
0.7254799183489045
Epoch 81/200, Loss: 0.030760986235691234
0.73369513799308
Epoch 91/200, Loss: 0.028947629762114957
0.7278463105354451
Epoch 101/200, Loss: 0.02821043468429707
0.7311779545681312
Epoch 111/200, Loss: 0.026847401459235698
0.7329627957529848
Epoch 121/200, Loss: 0.026184140209807083
0.7229092536165633
Epoch 131/200, Loss: 0.02620668729650788
0.7305552038277396
Epoch 141/200, Loss: 0.0251615532906726
0.7197334019934789
Epoch 151/200, Loss: 0.024244270200142637
0.7283110303668004
Epoch 161/200, Loss: 0.024176608450943604
0.723924

[I 2024-01-19 14:30:30,924] Trial 15 finished with value: 0.7355854042614565 and parameters: {'hidden_dim_h': 31, 'dropout': 0.14335983973468389, 'batch_size': 313}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 0.6814518313150149
0.6019088601499393
Epoch 11/200, Loss: 0.27084045998148015
0.631075135803626
Epoch 21/200, Loss: 0.18531926056823214
0.7154693775833909
Epoch 31/200, Loss: 0.1597501655688157
0.7307344072285327
Epoch 41/200, Loss: 0.13509770744555705
0.727249408941607
Epoch 51/200, Loss: 0.11131662815003782
0.7334647836041842
Epoch 61/200, Loss: 0.0899912179321856
0.7349446975969899
Epoch 71/200, Loss: 0.07099755793004422
0.7309289723431696
Epoch 81/200, Loss: 0.0561418396395606
0.7285233560881729
Epoch 91/200, Loss: 0.043954200941968606
0.7301660927516908
Epoch 101/200, Loss: 0.036010155202569186
0.7266077225195477
Epoch 111/200, Loss: 0.030322879452157666
0.7312223511315713
Epoch 121/200, Loss: 0.02689521503005479
0.7340437261352708
Epoch 131/200, Loss: 0.024314425633968535
0.7226017020179486
Epoch 141/200, Loss: 0.02256383918024398
0.7232499918986163
Epoch 151/200, Loss: 0.021944974775652628
0.7276783062362067
Epoch 161/200, Loss: 0.021392363048083073
0.72089946

[I 2024-01-19 14:31:30,392] Trial 16 finished with value: 0.7349446975969899 and parameters: {'hidden_dim_h': 23, 'dropout': 0.06228746515220718, 'batch_size': 544}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 1.6002012491226196
0.5588525568779651
Epoch 11/200, Loss: 0.8903813600540161
0.6437255910250311
Epoch 21/200, Loss: 0.5092254543304443
0.6919152679841046
Epoch 31/200, Loss: 0.3255336344242096
0.7124033271161577
Epoch 41/200, Loss: 0.2490030550956726
0.7170603550809344
Epoch 51/200, Loss: 0.2173779535293579
0.7202781649174417
Epoch 61/200, Loss: 0.2012835645675659
0.7203683129228297
Epoch 71/200, Loss: 0.18768038213253022
0.720931754484135
Epoch 81/200, Loss: 0.17389803767204284
0.7233009131184338
Epoch 91/200, Loss: 0.16016745150089265
0.7260153253055522
Epoch 101/200, Loss: 0.14573100566864014
0.7245817181618954
Epoch 111/200, Loss: 0.13096041917800905
0.7258075880932808
Epoch 121/200, Loss: 0.1172572910785675
0.7227070417002066
Epoch 131/200, Loss: 0.10361613631248474
0.7244340855153251
Epoch 141/200, Loss: 0.09111753582954407
0.7243456044546257
Epoch 151/200, Loss: 0.07972336530685425
0.7262696147515193
Epoch 161/200, Loss: 0.06957907319068908
0.7209991012794622


[I 2024-01-19 14:32:30,947] Trial 17 finished with value: 0.726393071897396 and parameters: {'hidden_dim_h': 32, 'dropout': 0.3164622732534086, 'batch_size': 812}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 1.4331243787493024
0.5752234913830003
Epoch 11/200, Loss: 0.558495386157717
0.6495498838316225
Epoch 21/200, Loss: 0.21071348871503556
0.6988714454585664
Epoch 31/200, Loss: 0.10518056814159665
0.7143733307729496
Epoch 41/200, Loss: 0.08147251712424415
0.7243332446181079
Epoch 51/200, Loss: 0.07512827430452619
0.7343995563510038
Epoch 61/200, Loss: 0.07125852203794888
0.7358068645814481
Epoch 71/200, Loss: 0.06761423189725195
0.7310333118117609
Epoch 81/200, Loss: 0.0637014525277274
0.7319754383513103
Epoch 91/200, Loss: 0.06033490215029035
0.7343105983487189
Epoch 101/200, Loss: 0.05730347793017115
0.7331125544148221
Epoch 111/200, Loss: 0.054605003339903695
0.7286944665258118
Epoch 121/200, Loss: 0.05195681612406458
0.7284669437501985
Epoch 131/200, Loss: 0.04958813477839742
0.7229089491226087
Epoch 141/200, Loss: 0.04759409949183464
0.7286898330494699
Epoch 151/200, Loss: 0.04605661364538329
0.7318397011237742
Epoch 161/200, Loss: 0.04531331977673939
0.72954686093

[I 2024-01-19 14:33:27,533] Trial 18 finished with value: 0.7358068645814481 and parameters: {'hidden_dim_h': 17, 'dropout': 0.26645661354211075, 'batch_size': 577}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 3.0768301136353435
0.512041355543099
Epoch 11/200, Loss: 0.9877951951587901
0.6666327073775958
Epoch 21/200, Loss: 0.264125329825808
0.6754373410418135
Epoch 31/200, Loss: 0.15203134277287653
0.7107280966928631
Epoch 41/200, Loss: 0.13005048080402262
0.718909434603463
Epoch 51/200, Loss: 0.11095641005565138
0.7226823395128016
Epoch 61/200, Loss: 0.09153686989756192
0.7356833864240848
Epoch 71/200, Loss: 0.07334742749876835
0.7331050212953124
Epoch 81/200, Loss: 0.058489124948049295
0.7313336116486383
Epoch 91/200, Loss: 0.04749328922480345
0.7378390471083195
Epoch 101/200, Loss: 0.041771806420429665
0.7355324979064779
Epoch 111/200, Loss: 0.03801291548263501
0.7346551689133126
Epoch 121/200, Loss: 0.03626800303840462
0.7337482646603464
Epoch 131/200, Loss: 0.035623260499799955
0.7388618508385232
Epoch 141/200, Loss: 0.03473226572660839
0.7338733831118455
Epoch 151/200, Loss: 0.03349831363405375
0.7264083645334998
Epoch 161/200, Loss: 0.03218903187114526
0.73082302921

[I 2024-01-19 14:34:40,766] Trial 19 finished with value: 0.7388618508385232 and parameters: {'hidden_dim_h': 26, 'dropout': 0.20662270391779824, 'batch_size': 297}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 0.16387442818709783
0.6302302676610089
Epoch 11/200, Loss: 0.10592249319666908
0.7133900796235844
Epoch 21/200, Loss: 0.08799043546120326
0.7235803056696669
Epoch 31/200, Loss: 0.07344996361505418
0.741231538407412
Epoch 41/200, Loss: 0.06117783309448333
0.7289791190060996
Epoch 51/200, Loss: 0.05284505035905611
0.7277396061301731
Epoch 61/200, Loss: 0.04545052047996294
0.7252168470049326
Epoch 71/200, Loss: 0.040686125379233135
0.7250487093265178
Epoch 81/200, Loss: 0.0368921034747646
0.7202340356855508
Epoch 91/200, Loss: 0.03498831480031922
0.7177957898135844
Epoch 101/200, Loss: 0.03274492573525224
0.7254267427630826
Epoch 111/200, Loss: 0.030858849663110005
0.7256943718269155
Epoch 121/200, Loss: 0.02978671643705595
0.7194017947715226
Epoch 131/200, Loss: 0.02813970608015855
0.7166615992833894
Epoch 141/200, Loss: 0.027292825902501743
0.7215072094786629
Epoch 151/200, Loss: 0.026967346668243408
0.7179773364755608
Epoch 161/200, Loss: 0.026986812019631976
0.72614

[I 2024-01-19 14:35:52,025] Trial 20 finished with value: 0.741231538407412 and parameters: {'hidden_dim_h': 43, 'dropout': 0.22080297739354032, 'batch_size': 985}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 0.24580534332328371
0.6284813933845009
Epoch 11/200, Loss: 0.15678537487983704
0.6985236379651729
Epoch 21/200, Loss: 0.10597613354523977
0.7237135401443919
Epoch 31/200, Loss: 0.0769639597998725
0.7286066467561284
Epoch 41/200, Loss: 0.06023604778779878
0.7308040407644408
Epoch 51/200, Loss: 0.0508885506954458
0.718153269831439
Epoch 61/200, Loss: 0.04661951760450999
0.720389136657471
Epoch 71/200, Loss: 0.04390826415684488
0.7248662113870616
Epoch 81/200, Loss: 0.04084981406728427
0.7245090132282224
Epoch 91/200, Loss: 0.03988048889570766
0.7251322391436805
Epoch 101/200, Loss: 0.03804880181948344
0.7240257701699967
Epoch 111/200, Loss: 0.03758014821343952
0.7193909108428392
Epoch 121/200, Loss: 0.036572492205434376
0.7218572295095029
Epoch 131/200, Loss: 0.03576346325377623
0.7237215371879863
Epoch 141/200, Loss: 0.03449902637965149
0.7178701056223278
Epoch 151/200, Loss: 0.033712906017899516
0.7164150366859263
Epoch 161/200, Loss: 0.03303496270543999
0.7208934406

[I 2024-01-19 14:37:01,847] Trial 21 finished with value: 0.7308040407644408 and parameters: {'hidden_dim_h': 35, 'dropout': 0.3211780192676232, 'batch_size': 445}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 0.26681016232722843
0.6341535462158467
Epoch 11/200, Loss: 0.1884175283022416
0.6833916478409571
Epoch 21/200, Loss: 0.14167011968600443
0.7083819636181466
Epoch 31/200, Loss: 0.10905714504993878
0.7100390175625725
Epoch 41/200, Loss: 0.08830976906495216
0.7159966611608144
Epoch 51/200, Loss: 0.07245056312053631
0.7280090629379312
Epoch 61/200, Loss: 0.06403698944128476
0.7243213088283365
Epoch 71/200, Loss: 0.05810314531509693
0.7297390787212972
Epoch 81/200, Loss: 0.0534700388327623
0.7369275326282454
Epoch 91/200, Loss: 0.05202736399876766
0.7336521372152686
Epoch 101/200, Loss: 0.04811307491782384
0.7289657162262574
Epoch 111/200, Loss: 0.04782573859661053
0.7330636984791413
Epoch 121/200, Loss: 0.046222129120276526
0.7266306524173982
Epoch 131/200, Loss: 0.046081047791701094
0.7353242906117642
Epoch 141/200, Loss: 0.04813749811206108
0.7350982922714326
Epoch 151/200, Loss: 0.041967607222688504
0.7345310998337926
Epoch 161/200, Loss: 0.0439783017604779
0.73295715

[I 2024-01-19 14:38:23,150] Trial 22 finished with value: 0.7369275326282454 and parameters: {'hidden_dim_h': 50, 'dropout': 0.2765043764487713, 'batch_size': 526}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 0.2752387424310048
0.62556379352467
Epoch 11/200, Loss: 0.20999769314571662
0.6988177828574836
Epoch 21/200, Loss: 0.16090361884346716
0.7117893719218973
Epoch 31/200, Loss: 0.12476323407005381
0.7242637734142007
Epoch 41/200, Loss: 0.09824154801942685
0.7254417870290503
Epoch 51/200, Loss: 0.07849483523103926
0.7238852054188092
Epoch 61/200, Loss: 0.06455231140609141
0.7282499614418284
Epoch 71/200, Loss: 0.054294107688797846
0.7289912468222595
Epoch 81/200, Loss: 0.048416409779478004
0.721183317331554
Epoch 91/200, Loss: 0.04322515855784769
0.7234704532548375
Epoch 101/200, Loss: 0.04048748038433216
0.7254422460654595
Epoch 111/200, Loss: 0.03867527856319039
0.7175545342673716
Epoch 121/200, Loss: 0.036867733768842836
0.71731436281781
Epoch 131/200, Loss: 0.035762184885916884
0.7166302148377943
Epoch 141/200, Loss: 0.034065547571689996
0.7159037603669997
Epoch 151/200, Loss: 0.03453264585523694
0.7196327173132845
Epoch 161/200, Loss: 0.032800096121651155
0.72003900

[I 2024-01-19 14:39:34,076] Trial 23 finished with value: 0.7289912468222595 and parameters: {'hidden_dim_h': 41, 'dropout': 0.34553396455786634, 'batch_size': 763}. Best is trial 11 with value: 0.7427472413365445.


Epoch 1/200, Loss: 0.14771726699890914
0.6365259437063518
Epoch 11/200, Loss: 0.08886873708279044
0.7173446446911917
Epoch 21/200, Loss: 0.06756766913113771
0.7294632529131385
Epoch 31/200, Loss: 0.055138620306496265
0.7350449752841036
Epoch 41/200, Loss: 0.04884749264628799
0.7437495589054155
Epoch 51/200, Loss: 0.04379001701319659
0.7438960241503889
Epoch 61/200, Loss: 0.04154812289332902
0.7348457581165458
Epoch 71/200, Loss: 0.03880081391306939
0.7374605157147315
Epoch 81/200, Loss: 0.037252738416470865
0.729770639530979
Epoch 91/200, Loss: 0.03517419424045969
0.7301044353742788
Epoch 101/200, Loss: 0.03413703227070747
0.7305496626496987
Epoch 111/200, Loss: 0.03311361251743855
0.7220414504719094
Epoch 121/200, Loss: 0.03215774866165938
0.724929033081322
Epoch 131/200, Loss: 0.03105027811532771
0.7253318731226543
Epoch 141/200, Loss: 0.03014819437844886
0.7197117047364633
Epoch 151/200, Loss: 0.029617987228212534
0.7222446763797319
Epoch 161/200, Loss: 0.028660571237129194
0.723498

[I 2024-01-19 14:40:47,649] Trial 24 finished with value: 0.7438960241503889 and parameters: {'hidden_dim_h': 36, 'dropout': 0.23828991621113252, 'batch_size': 374}. Best is trial 24 with value: 0.7438960241503889.


Epoch 1/200, Loss: 0.21876426299256602
0.6271432655062333
Epoch 11/200, Loss: 0.09034509123779658
0.7145429710845521
Epoch 21/200, Loss: 0.05931282483451948
0.7297924618120148
Epoch 31/200, Loss: 0.04983868306194703
0.7390877425109068
Epoch 41/200, Loss: 0.0449416952163685
0.7331497122722028
Epoch 51/200, Loss: 0.041402914524665026
0.731754997633523
Epoch 61/200, Loss: 0.0385075765918559
0.7253906813194448
Epoch 71/200, Loss: 0.036117576972002116
0.7325988526540789
Epoch 81/200, Loss: 0.03450770618936678
0.7306062709158081
Epoch 91/200, Loss: 0.03318472086327282
0.7300917218740032
Epoch 101/200, Loss: 0.03224247937479357
0.7276752408868905
Epoch 111/200, Loss: 0.03126444990240683
0.7294791201854017
Epoch 121/200, Loss: 0.030245629395908257
0.7268198968711667
Epoch 131/200, Loss: 0.029211311549769612
0.726516310092898
Epoch 141/200, Loss: 0.028336667037737653
0.727614206652689
Epoch 151/200, Loss: 0.027990625731236354
0.7338922171048889
Epoch 161/200, Loss: 0.027612656721566604
0.727449

[I 2024-01-19 14:42:28,626] Trial 25 finished with value: 0.7390877425109068 and parameters: {'hidden_dim_h': 34, 'dropout': 0.1730691847470238, 'batch_size': 158}. Best is trial 24 with value: 0.7438960241503889.


Epoch 1/200, Loss: 0.7386350463021476
0.5986609782932246
Epoch 11/200, Loss: 0.2195596770857865
0.7096144773578862
Epoch 21/200, Loss: 0.16909999751819754
0.718002209989677
Epoch 31/200, Loss: 0.1393365016523397
0.7266465511253632
Epoch 41/200, Loss: 0.11011632278842746
0.7251474852915643
Epoch 51/200, Loss: 0.08473670707558686
0.7297668515030145
Epoch 61/200, Loss: 0.06553922214035718
0.7328163673689865
Epoch 71/200, Loss: 0.051935734121866944
0.736570895016408
Epoch 81/200, Loss: 0.04362959126537701
0.739596782242816
Epoch 91/200, Loss: 0.03873713026350399
0.737491171770001
Epoch 101/200, Loss: 0.036422045233677015
0.7354062957675386
Epoch 111/200, Loss: 0.034311249114151274
0.7349530719903654
Epoch 121/200, Loss: 0.03356562797331585
0.7301431649766731
Epoch 131/200, Loss: 0.032397929614163795
0.7292617825370389
Epoch 141/200, Loss: 0.03128810339378861
0.7290277701706265
Epoch 151/200, Loss: 0.03070550264333779
0.730669945801626
Epoch 161/200, Loss: 0.02994832512483282
0.727423005180

[I 2024-01-19 14:43:49,058] Trial 26 finished with value: 0.739596782242816 and parameters: {'hidden_dim_h': 46, 'dropout': 0.31348112909681836, 'batch_size': 380}. Best is trial 24 with value: 0.7438960241503889.


Epoch 1/200, Loss: 1.4203155158478538
0.5484591101490949
Epoch 11/200, Loss: 0.18288773427039018
0.6960057518005689
Epoch 21/200, Loss: 0.09464756923693197
0.720215886955237
Epoch 31/200, Loss: 0.08116245646903544
0.731978623597812
Epoch 41/200, Loss: 0.06907107497071042
0.7301605030554355
Epoch 51/200, Loss: 0.058355791931167064
0.7356975000635897
Epoch 61/200, Loss: 0.04972060222500636
0.7292031110203012
Epoch 71/200, Loss: 0.04493304866331595
0.738552700407911
Epoch 81/200, Loss: 0.04242664189250381
0.7330700297494539
Epoch 91/200, Loss: 0.039593121542790786
0.7286518434385961
Epoch 101/200, Loss: 0.038170325190380765
0.73524651160087
Epoch 111/200, Loss: 0.037716754585688496
0.730818470596757
Epoch 121/200, Loss: 0.03580714497761226
0.7259653749836613
Epoch 131/200, Loss: 0.03472097887209168
0.7341525388296901
Epoch 141/200, Loss: 0.033888453571700755
0.72505976103388
Epoch 151/200, Loss: 0.03317651955157886
0.727567066253984
Epoch 161/200, Loss: 0.03316253607655749
0.7267819482611

[I 2024-01-19 14:45:09,267] Trial 27 finished with value: 0.738552700407911 and parameters: {'hidden_dim_h': 27, 'dropout': 0.24341802372114837, 'batch_size': 249}. Best is trial 24 with value: 0.7438960241503889.


Epoch 1/200, Loss: 0.7964697544639175
0.570780120681358
Epoch 11/200, Loss: 0.2323278816970619
0.6786047922653223
Epoch 21/200, Loss: 0.10338687010713525
0.7174217946827353
Epoch 31/200, Loss: 0.08387304077277312
0.7305980078043695
Epoch 41/200, Loss: 0.07749543761884845
0.7384739406146078
Epoch 51/200, Loss: 0.07205347837628545
0.7376382520142644
Epoch 61/200, Loss: 0.06567502756779259
0.739498625026909
Epoch 71/200, Loss: 0.06094237296162425
0.7396809172654687
Epoch 81/200, Loss: 0.05652831434398084
0.7347271567332803
Epoch 91/200, Loss: 0.05257384609934446
0.7315049878154715
Epoch 101/200, Loss: 0.04877478136001406
0.7323664233996954
Epoch 111/200, Loss: 0.046523543527802906
0.7322532797351721
Epoch 121/200, Loss: 0.04498176528392611
0.7309352071636946
Epoch 131/200, Loss: 0.04269682223329673
0.739280146724846
Epoch 141/200, Loss: 0.041562441837143256
0.7331500234735528
Epoch 151/200, Loss: 0.04111735311311644
0.7383786720807384
Epoch 161/200, Loss: 0.039863178959569416
0.7349096662

[I 2024-01-19 14:46:08,119] Trial 28 finished with value: 0.7396809172654687 and parameters: {'hidden_dim_h': 21, 'dropout': 0.2755033118092165, 'batch_size': 549}. Best is trial 24 with value: 0.7438960241503889.


Epoch 1/200, Loss: 0.22523878514766693
0.6041201943476164
Epoch 11/200, Loss: 0.17548365245262781
0.6810474666688291
Epoch 21/200, Loss: 0.14269219636917113
0.704716600627921
Epoch 31/200, Loss: 0.11657879451910655
0.7205252462921913
Epoch 41/200, Loss: 0.096745781848828
0.7347095218751742
Epoch 51/200, Loss: 0.08284682755668958
0.7277880255224313
Epoch 61/200, Loss: 0.07266757612427076
0.7300395957213596
Epoch 71/200, Loss: 0.06607707937558492
0.734876072342591
Epoch 81/200, Loss: 0.061725390950838725
0.7362295083902204
Epoch 91/200, Loss: 0.0580105888346831
0.7358907413212732
Epoch 101/200, Loss: 0.05632591694593429
0.7251336370075093
Epoch 111/200, Loss: 0.054809523622194926
0.7310151920677623
Epoch 121/200, Loss: 0.05369650758802891
0.734123435258918
Epoch 131/200, Loss: 0.05272080736855666
0.7353214655353665
Epoch 141/200, Loss: 0.052137560397386554
0.7383781609444775
Epoch 151/200, Loss: 0.05215230956673622
0.7386829727663119
Epoch 161/200, Loss: 0.05009539611637592
0.73393528554

[I 2024-01-19 14:47:01,083] Trial 29 finished with value: 0.7386829727663119 and parameters: {'hidden_dim_h': 16, 'dropout': 0.3284580238115084, 'batch_size': 682}. Best is trial 24 with value: 0.7438960241503889.


Epoch 1/200, Loss: 0.23662771391017096
0.6333372128762679
Epoch 11/200, Loss: 0.15927693620324135
0.7122072375506175
Epoch 21/200, Loss: 0.1361727969987052
0.718335081141094
Epoch 31/200, Loss: 0.11453567631542683
0.7273102219111378
Epoch 41/200, Loss: 0.09366774958159242
0.72923312306892
Epoch 51/200, Loss: 0.07893549837172031
0.7240339382057733
Epoch 61/200, Loss: 0.06519720490489687
0.7268222436676527
Epoch 71/200, Loss: 0.05638030224612781
0.7314655392581846
Epoch 81/200, Loss: 0.04950538397367511
0.733184922171355
Epoch 91/200, Loss: 0.043770503252744675
0.7264213948240686
Epoch 101/200, Loss: 0.03956054310713496
0.7353031868996732
Epoch 111/200, Loss: 0.037003843779010434
0.7261668475191103
Epoch 121/200, Loss: 0.03550254773082478
0.7235119445622601
Epoch 131/200, Loss: 0.03368796042299697
0.7258588884429218
Epoch 141/200, Loss: 0.03376472029568894
0.7272333908491714
Epoch 151/200, Loss: 0.03261930189494576
0.73098946464356
Epoch 161/200, Loss: 0.031863088120839426
0.720878103279

[I 2024-01-19 14:48:15,279] Trial 30 finished with value: 0.7353031868996732 and parameters: {'hidden_dim_h': 47, 'dropout': 0.3020226576016949, 'batch_size': 738}. Best is trial 24 with value: 0.7438960241503889.


Epoch 1/200, Loss: 0.5699807330965996
0.5821175705086856
Epoch 11/200, Loss: 0.10164987695004259
0.7155444510175912
Epoch 21/200, Loss: 0.0750570073723793
0.7293833157533661
Epoch 31/200, Loss: 0.0653520413408322
0.7368488956111162
Epoch 41/200, Loss: 0.05705156223848462
0.7442556344812707
Epoch 51/200, Loss: 0.04960363285083856
0.7395905896426521
Epoch 61/200, Loss: 0.04344696631389005
0.7354104067099141
Epoch 71/200, Loss: 0.04005965730175376
0.742530617164623
Epoch 81/200, Loss: 0.037106051741700084
0.7361692858722206
Epoch 91/200, Loss: 0.03502004813136799
0.735160343547715
Epoch 101/200, Loss: 0.03405884636699089
0.7288945202618279
Epoch 111/200, Loss: 0.03300154165896986
0.7407812794456213
Epoch 121/200, Loss: 0.031147567655092905
0.7390833402267383
Epoch 131/200, Loss: 0.0309015751284148
0.7371161314860613
Epoch 141/200, Loss: 0.029612952543954765
0.7326988814149757
Epoch 151/200, Loss: 0.02930227291238095
0.7340400777652286
Epoch 161/200, Loss: 0.02830082065026675
0.73826809664

[I 2024-01-19 14:49:30,992] Trial 31 finished with value: 0.7442556344812707 and parameters: {'hidden_dim_h': 38, 'dropout': 0.2473750225811697, 'batch_size': 359}. Best is trial 31 with value: 0.7442556344812707.


Epoch 1/200, Loss: 0.32587306120178916
0.6176799097610008


[I 2024-01-19 14:49:32,134] Trial 32 finished with value: 0.6176799097610008 and parameters: {'hidden_dim_h': 29, 'dropout': 0.2241343556565365, 'batch_size': 369}. Best is trial 31 with value: 0.7442556344812707.
[W 2024-01-19 14:49:32,297] Trial 33 failed with parameters: {'hidden_dim_h': 34, 'dropout': 0.2641535390871006, 'batch_size': 157} because of the following error: ValueError('zero-size array to reduction operation maximum which has no identity').
Traceback (most recent call last):
  File "/home/juannanzhou/.local/lib/python3.10/site-packages/optuna/study/_optimize.py", line 200, in _run_trial
    value_or_values = func(trial)
  File "/scratch/local/21743416/ipykernel_2182428/1032276540.py", line 55, in objective
    return np.array(r2_test).max()
  File "/apps/pytorch/2.0.1/lib/python3.10/site-packages/numpy/core/_methods.py", line 41, in _amax
    return umr_maximum(a, axis, None, out, keepdims, initial, where)
ValueError: zero-size array to reduction operation maximum whic

training failed
training failed


ValueError: zero-size array to reduction operation maximum which has no identity

#### 1 layer no softmax

In [124]:
import optuna
from scipy.stats import pearsonr
learning_rate = 0.001
epochs = 200
num_heads = 4
num_layers = 1
sequence_length = L
input_dim = AA_size*L
output_dim = 1
dropout_init = 0.3
batch_size_init = 1000
hidden_dim_h_init = 32

def objective(trial):
    # Define the hyperparameters to be optimized
    # hidden_dim_h = trial.suggest_int('hidden_dim_h', hidden_dim_h_init, 10, 50)
    # dropout = trial.suggest_float('dropout', dropout_init, 0.05, 0.35)
    # batch_size = trial.suggest_int('batch_size', batch_size_init, 100, 1200)

    hidden_dim_h = trial.suggest_int('hidden_dim_h', 10, 50)
    dropout = trial.suggest_float('dropout', 0.05, 0.35)
    batch_size = trial.suggest_int('batch_size', 100, 1200)
    
    model = Transformer_torch_MHA(input_dim, hidden_dim_h*num_heads, num_layers, num_heads, dropout).to(device)
    
    train_loader = data.DataLoader(train_dataset,
                                   batch_size=batch_size,
                                   shuffle=True,
                                   drop_last=False)
    criterion = nn.MSELoss()
    optimizer = optim.Adam(model.parameters(), lr=learning_rate)

    r2_test = []
    try: 
        for epoch in range(epochs):

                model.train()
                total_loss = 0
                for batch_inputs, batch_targets in train_loader:
                    optimizer.zero_grad()
                    outputs = model(batch_inputs)
                    loss = criterion(outputs, batch_targets)
                    loss.backward()
                    optimizer.step()
                    total_loss += loss.item()

                if epoch % 10 == 0:
                    print(f"Epoch {epoch+1}/{epochs}, Loss: {total_loss/len(train_loader)}")
                    model.eval()
                    pred, true = model(X_test.flatten(1)).flatten().detach().cpu().numpy(), y_test.flatten().detach().cpu().numpy()
                    print(pearsonr(pred, true)[0]**2)
                    r2_test.append(pearsonr(pred, true)[0]**2)
    except: print("training failed")
            
    return np.array(r2_test).max()

In [125]:
# Create and run the Optuna study
study = optuna.create_study(direction='maximize')
study.optimize(objective, n_trials=100)

# Print the best hyperparameters
best_trial = study.best_trial
print("Best Trial:")
print(f"  Value: {best_trial.value:.4f}")
print("  Params: ")
for key, value in best_trial.params.items():
    print(f"    {key}: {value}")

# You can then use the best hyperparameters to train your final model.


[I 2024-01-19 14:49:39,349] A new study created in memory with name: no-name-e9ea7607-87db-4b61-bb7f-9b910311dda2


Epoch 1/200, Loss: 2.369227488835653
0.5885783602266235
Epoch 11/200, Loss: 1.564675041607448
0.5687010547989698
Epoch 21/200, Loss: 0.977824106102898
0.6168301267674828
Epoch 31/200, Loss: 0.6032880856877282
0.6309281972029587
Epoch 41/200, Loss: 0.3756717982746306
0.6369905590905649
Epoch 51/200, Loss: 0.24739797839096614
0.6438527839160176
Epoch 61/200, Loss: 0.18129653802939824
0.6476167126628367
Epoch 71/200, Loss: 0.1501993558236531
0.6520920226010735
Epoch 81/200, Loss: 0.13604776632218135
0.6519373718669332
Epoch 91/200, Loss: 0.13013785367920286
0.653817060791295
Epoch 101/200, Loss: 0.1267480750878652
0.6546581287966964
Epoch 111/200, Loss: 0.12424864797365098
0.6559420070429822
Epoch 121/200, Loss: 0.1218521414058549
0.6538514804182441
Epoch 131/200, Loss: 0.11957856941790808
0.6545754387810171
Epoch 141/200, Loss: 0.11716450679869879
0.6550949513774927
Epoch 151/200, Loss: 0.11444540144432158
0.6554019361019249
Epoch 161/200, Loss: 0.11203344414631526
0.6543597009575278
Epo

[I 2024-01-19 14:50:26,069] Trial 0 finished with value: 0.6569300643465438 and parameters: {'hidden_dim_h': 35, 'dropout': 0.16429546359306352, 'batch_size': 958}. Best is trial 0 with value: 0.6569300643465438.


Epoch 1/200, Loss: 1.3508108568191528
0.5867471119475914
Epoch 11/200, Loss: 0.3634290027618408
0.6393426678173904
Epoch 21/200, Loss: 0.1488633893430233
0.6439030518080032
Epoch 31/200, Loss: 0.12356060236692429
0.6506159114339983
Epoch 41/200, Loss: 0.11774183541536332
0.653085333954796
Epoch 51/200, Loss: 0.11244198441505432
0.6488151625660766
Epoch 61/200, Loss: 0.1074792255461216
0.653848549132271
Epoch 71/200, Loss: 0.10220815017819404
0.6553455198061154
Epoch 81/200, Loss: 0.09737571537494659
0.6580990886609247
Epoch 91/200, Loss: 0.0943614438176155
0.6545580959683471
Epoch 101/200, Loss: 0.0915521351993084
0.6579591520313618
Epoch 111/200, Loss: 0.09116977363824845
0.6538200491614158
Epoch 121/200, Loss: 0.09040695652365685
0.658195318389405
Epoch 131/200, Loss: 0.09013764068484306
0.6572401763979355
Epoch 141/200, Loss: 0.08965965062379837
0.6551434089551754
Epoch 151/200, Loss: 0.09011358395218849
0.6546847940921997
Epoch 161/200, Loss: 0.0901513685286045
0.6582544641019343
E

[I 2024-01-19 14:51:18,302] Trial 1 finished with value: 0.659444386521454 and parameters: {'hidden_dim_h': 40, 'dropout': 0.3296206513523845, 'batch_size': 404}. Best is trial 1 with value: 0.659444386521454.


Epoch 1/200, Loss: 2.439992588619853
0.5633464654157084
Epoch 11/200, Loss: 1.1109332137329633
0.6193966457502362
Epoch 21/200, Loss: 0.4722847127637198
0.5970825665400014
Epoch 31/200, Loss: 0.2264272587936978
0.6405522286823616
Epoch 41/200, Loss: 0.17042668544968895
0.6514475887797552
Epoch 51/200, Loss: 0.1579129609257676
0.6490259707720811
Epoch 61/200, Loss: 0.1485642763071282
0.6554419805279107
Epoch 71/200, Loss: 0.1396552740141403
0.6533411134355016
Epoch 81/200, Loss: 0.1301012461961702
0.6542156413370448
Epoch 91/200, Loss: 0.12153423075066057
0.6563612868768506
Epoch 101/200, Loss: 0.11271103367555974
0.6536957144583775
Epoch 111/200, Loss: 0.10531379213166792
0.6528712006841446
Epoch 121/200, Loss: 0.10016940967288128
0.6551325005595714
Epoch 131/200, Loss: 0.09491064711365589
0.6561604719452235
Epoch 141/200, Loss: 0.0925268700649572
0.6541962982501174
Epoch 151/200, Loss: 0.09080214313296385
0.6563383169035708
Epoch 161/200, Loss: 0.0895228472559951
0.6572797201357444
Ep

[I 2024-01-19 14:52:06,394] Trial 2 finished with value: 0.6595504287168961 and parameters: {'hidden_dim_h': 28, 'dropout': 0.1954013216551589, 'batch_size': 475}. Best is trial 2 with value: 0.6595504287168961.


Epoch 1/200, Loss: 1.9812895266906074
0.5917684489583411
Epoch 11/200, Loss: 1.2646831118542214
0.6169350996122588
Epoch 21/200, Loss: 0.7292372428852579
0.6143779198085487
Epoch 31/200, Loss: 0.42008136407188745
0.6362823974679161
Epoch 41/200, Loss: 0.2626257370347562
0.6437470482470778
Epoch 51/200, Loss: 0.19012321920498557
0.6460772418235327
Epoch 61/200, Loss: 0.16158765360065128
0.6534169366209734
Epoch 71/200, Loss: 0.14987593241359876
0.6495578704414389
Epoch 81/200, Loss: 0.14415694902772488
0.6486832285977737
Epoch 91/200, Loss: 0.14031280965908713
0.6553806283675951
Epoch 101/200, Loss: 0.13606900559819263
0.6524651022664232
Epoch 111/200, Loss: 0.13157816749552023
0.6546850644701321
Epoch 121/200, Loss: 0.12745315905498422
0.6532025398383148
Epoch 131/200, Loss: 0.12371836473112521
0.6568092461926679
Epoch 141/200, Loss: 0.11928017793790154
0.6557874290566029
Epoch 151/200, Loss: 0.11569922320220781
0.6543165340089232
Epoch 161/200, Loss: 0.11169698672450107
0.655270927790

[I 2024-01-19 14:52:53,888] Trial 3 finished with value: 0.6568092461926679 and parameters: {'hidden_dim_h': 40, 'dropout': 0.12056321305751974, 'batch_size': 894}. Best is trial 2 with value: 0.6595504287168961.


Epoch 1/200, Loss: 0.2939497326549731
0.5996361738821986
Epoch 11/200, Loss: 0.2064236092724298
0.6484621386036994
Epoch 21/200, Loss: 0.16039171658064189
0.6505177284176688
Epoch 31/200, Loss: 0.12932678861053368
0.6455223218549004
Epoch 41/200, Loss: 0.11034052191596282
0.6552102110052853
Epoch 51/200, Loss: 0.0991364688073334
0.6542957489958434
Epoch 61/200, Loss: 0.09378120538435485
0.6547853887356652
Epoch 71/200, Loss: 0.09108250960707664
0.6584900613147276
Epoch 81/200, Loss: 0.09033709842907756
0.652783731109494
Epoch 91/200, Loss: 0.09026499229826425
0.6560423301671356
Epoch 101/200, Loss: 0.08998384503157515
0.6556499244356733
Epoch 111/200, Loss: 0.08985354967023197
0.6557965552301791
Epoch 121/200, Loss: 0.08934157165257554
0.6572603037116908
Epoch 131/200, Loss: 0.08938198183712207
0.6597723705946728
Epoch 141/200, Loss: 0.08955498725960129
0.6584986554696823
Epoch 151/200, Loss: 0.0894565119555122
0.65889765767304
Epoch 161/200, Loss: 0.08985300734639168
0.657858000599243

[I 2024-01-19 14:53:40,225] Trial 4 finished with value: 0.6597723705946728 and parameters: {'hidden_dim_h': 27, 'dropout': 0.30708668201941497, 'batch_size': 533}. Best is trial 4 with value: 0.6597723705946728.


Epoch 1/200, Loss: 0.28945801908319646
0.6141998199265287
Epoch 11/200, Loss: 0.18642270429567856
0.6471112596139877
Epoch 21/200, Loss: 0.14882198517972772
0.6456119329495549
Epoch 31/200, Loss: 0.12144768644462932
0.651883561913838
Epoch 41/200, Loss: 0.10403930707411332
0.6532233062944487
Epoch 51/200, Loss: 0.09535591344941746
0.658475201864976
Epoch 61/200, Loss: 0.09157433618198742
0.6553296687536906
Epoch 71/200, Loss: 0.08989497219974345
0.6549879577207091
Epoch 81/200, Loss: 0.08962955501946536
0.6566204085067144
Epoch 91/200, Loss: 0.08916650861501693
0.6573254811573482
Epoch 101/200, Loss: 0.08968093598430807
0.651791619186125
Epoch 111/200, Loss: 0.08880085714838722
0.6588992918374932
Epoch 121/200, Loss: 0.08858285654674877
0.65644255469739
Epoch 131/200, Loss: 0.08906043591824445
0.6588434427973199
Epoch 141/200, Loss: 0.08880654492161491
0.6581141495331279
Epoch 151/200, Loss: 0.08921031193299726
0.6582067512074101
Epoch 161/200, Loss: 0.08853787874633616
0.6588499144043

[I 2024-01-19 14:54:37,519] Trial 5 finished with value: 0.6588992918374932 and parameters: {'hidden_dim_h': 48, 'dropout': 0.20438399666208834, 'batch_size': 368}. Best is trial 4 with value: 0.6597723705946728.


Epoch 1/200, Loss: 1.1093344952239366
0.5474788444920149
Epoch 11/200, Loss: 0.23955463703538551
0.6397742390164094
Epoch 21/200, Loss: 0.15785904228687286
0.6523861368568751
Epoch 31/200, Loss: 0.14386111974227625
0.6543107413789914
Epoch 41/200, Loss: 0.12964930812843511
0.6495706791633583
Epoch 51/200, Loss: 0.1166001105161964
0.6555248796975738
Epoch 61/200, Loss: 0.10563346792439945
0.655669048331795
Epoch 71/200, Loss: 0.09802021709133367
0.6562339503975998
Epoch 81/200, Loss: 0.09359061351565064
0.6567369848540838
Epoch 91/200, Loss: 0.09165903388476762
0.653741167671175
Epoch 101/200, Loss: 0.09085360291551371
0.6571176952553694
Epoch 111/200, Loss: 0.09042423719265422
0.6561177459833345
Epoch 121/200, Loss: 0.08999990110026031
0.6599845525351876
Epoch 131/200, Loss: 0.08992394426318466
0.6569820692303922
Epoch 141/200, Loss: 0.09002356292282948
0.6574591382955307
Epoch 151/200, Loss: 0.08997851255975786
0.6556671079186621
Epoch 161/200, Loss: 0.08954089293714429
0.656906320545

[I 2024-01-19 14:55:34,059] Trial 6 finished with value: 0.6599845525351876 and parameters: {'hidden_dim_h': 37, 'dropout': 0.3351804762010545, 'batch_size': 331}. Best is trial 6 with value: 0.6599845525351876.


Epoch 1/200, Loss: 1.708720171773756
0.5799306103630549
Epoch 11/200, Loss: 0.7636394114107699
0.6212377814679254
Epoch 21/200, Loss: 0.388437732651427
0.641674778363287
Epoch 31/200, Loss: 0.27754357336340724
0.6491150438221628
Epoch 41/200, Loss: 0.24621394236345548
0.6489587416667063
Epoch 51/200, Loss: 0.2269613565625371
0.6489488675186578
Epoch 61/200, Loss: 0.20824859633639053
0.6461875761996937
Epoch 71/200, Loss: 0.18943619285080884
0.6474832893707687
Epoch 81/200, Loss: 0.17113380939573855
0.6503493588834931
Epoch 91/200, Loss: 0.15346976389756073
0.6514503336149832
Epoch 101/200, Loss: 0.13765067063473366
0.6503820023865274
Epoch 111/200, Loss: 0.12446656621791222
0.6497270912974795
Epoch 121/200, Loss: 0.11345138441066484
0.651154133655738
Epoch 131/200, Loss: 0.1041939816362149
0.6527587393658072
Epoch 141/200, Loss: 0.09798914878755002
0.6554786901381401
Epoch 151/200, Loss: 0.09323381773523383
0.6533147058106554
Epoch 161/200, Loss: 0.09119203988764737
0.6555101188467807


[I 2024-01-19 14:56:26,246] Trial 7 finished with value: 0.6602838188368743 and parameters: {'hidden_dim_h': 43, 'dropout': 0.21338253615076058, 'batch_size': 553}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.6637808322906494
0.5849011698205162
Epoch 11/200, Loss: 0.3155470982193947
0.6370262965301793
Epoch 21/200, Loss: 0.17151401340961456
0.6466869947210614
Epoch 31/200, Loss: 0.12026553973555565
0.6483762174301616
Epoch 41/200, Loss: 0.1060929823666811
0.656171972493487
Epoch 51/200, Loss: 0.10241408534348011
0.6542789965821839
Epoch 61/200, Loss: 0.10100063309073448
0.6567567097664578
Epoch 71/200, Loss: 0.09999779351055622
0.6567650351708494
Epoch 81/200, Loss: 0.09863491468131542
0.6586520269817903
Epoch 91/200, Loss: 0.0977169219404459
0.6561349205322402
Epoch 101/200, Loss: 0.09639056771993637
0.657889913875948
Epoch 111/200, Loss: 0.09515296779572964
0.6563447470813353
Epoch 121/200, Loss: 0.09422618001699448
0.6592524435487355
Epoch 131/200, Loss: 0.0930606558918953
0.6565010172756166
Epoch 141/200, Loss: 0.09204991832375527
0.656333480779873
Epoch 151/200, Loss: 0.09185789152979851
0.6581904081519457
Epoch 161/200, Loss: 0.09071983061730862
0.656208168563685


[I 2024-01-19 14:57:08,689] Trial 8 finished with value: 0.6595846586054682 and parameters: {'hidden_dim_h': 25, 'dropout': 0.23955763303589, 'batch_size': 1014}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.37529170337845297
0.5767869852475627
Epoch 11/200, Loss: 0.26088176755344167
0.6458263917177726
Epoch 21/200, Loss: 0.231622593367801
0.6519378240434446
Epoch 31/200, Loss: 0.21256912631147049
0.6499337092315557
Epoch 41/200, Loss: 0.1940565345918431
0.6517262836717808
Epoch 51/200, Loss: 0.1767884396454867
0.6509806414806939
Epoch 61/200, Loss: 0.1610286419882494
0.6533212438908022
Epoch 71/200, Loss: 0.14710022158482494
0.6545463685123932
Epoch 81/200, Loss: 0.13533532093552983
0.6542634433149966
Epoch 91/200, Loss: 0.12512302048066082
0.6551511048334431
Epoch 101/200, Loss: 0.11662756651639938
0.6568305387011432
Epoch 111/200, Loss: 0.10976572422420278
0.654380474990945
Epoch 121/200, Loss: 0.10416612423518125
0.6567454584457478
Epoch 131/200, Loss: 0.09979298360207502
0.6570596984131359
Epoch 141/200, Loss: 0.0961013773784918
0.6577882437823424
Epoch 151/200, Loss: 0.09420319471289129
0.658409046484316
Epoch 161/200, Loss: 0.09223373146618113
0.6575426719765173

[I 2024-01-19 14:57:49,191] Trial 9 finished with value: 0.6591485985364469 and parameters: {'hidden_dim_h': 16, 'dropout': 0.21911939250207324, 'batch_size': 1179}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.9587144524086523
0.6001913605282498
Epoch 11/200, Loss: 0.11245922112965402
0.6522048545240788
Epoch 21/200, Loss: 0.10194655155180064
0.6511862348074283
Epoch 31/200, Loss: 0.09409754819997394
0.653419178088022
Epoch 41/200, Loss: 0.09060456330767115
0.6540344566241102
Epoch 51/200, Loss: 0.09021140748762903
0.6546605296919761
Epoch 61/200, Loss: 0.08960247864477507
0.6569205853070674
Epoch 71/200, Loss: 0.08959276752390025
0.6574332093119692
Epoch 81/200, Loss: 0.08967118636342405
0.6550827508834016
Epoch 91/200, Loss: 0.08896942959941981
0.6577774188816735
Epoch 101/200, Loss: 0.08914860810032328
0.6567728810623715
Epoch 111/200, Loss: 0.08917139280047126
0.6565472992084247
Epoch 121/200, Loss: 0.08940325108648256
0.6571136947694959
Epoch 131/200, Loss: 0.08909278980079498
0.6578197240287548
Epoch 141/200, Loss: 0.08898794616906698
0.6578497254732192
Epoch 151/200, Loss: 0.08893002308052005
0.6592293301382549
Epoch 161/200, Loss: 0.08913855925771116
0.6587882618

[I 2024-01-19 14:59:09,162] Trial 10 finished with value: 0.6592293301382549 and parameters: {'hidden_dim_h': 46, 'dropout': 0.07421443112290799, 'batch_size': 153}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.8801089326540629
0.5996849939452785
Epoch 11/200, Loss: 0.3319408009449641
0.6313575738003774
Epoch 21/200, Loss: 0.15147522687911988
0.6477135379962227
Epoch 31/200, Loss: 0.10913975064953169
0.6500295276452335
Epoch 61/200, Loss: 0.0985019974410534
0.6564704553679207
Epoch 71/200, Loss: 0.09751051068305969
0.6566523595655932
Epoch 81/200, Loss: 0.0960802378753821
0.6578888346528698
Epoch 91/200, Loss: 0.09467260614037513
0.6560098348057127
Epoch 101/200, Loss: 0.09357148135701815
0.657616917787771
Epoch 111/200, Loss: 0.09231359288096427
0.6562434498297157
Epoch 121/200, Loss: 0.09130457316835722
0.6555804528438106
Epoch 131/200, Loss: 0.09011902486284575
0.6564071121289058
Epoch 141/200, Loss: 0.09021263296405474
0.6555832418743249
Epoch 151/200, Loss: 0.09003721550107002
0.6583553218159536
Epoch 161/200, Loss: 0.08946536059180896
0.6587047519086459
Epoch 171/200, Loss: 0.08945463200410207
0.6587876813581326
Epoch 181/200, Loss: 0.0893090474108855
0.657428151120

[I 2024-01-19 14:59:56,525] Trial 11 finished with value: 0.6592066681291998 and parameters: {'hidden_dim_h': 37, 'dropout': 0.2785921642575598, 'batch_size': 677}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.32277381526572363
0.6151321212372893
Epoch 11/200, Loss: 0.17606387996957415
0.6390112884744996
Epoch 21/200, Loss: 0.11834486094968659
0.6498110969061731
Epoch 31/200, Loss: 0.09698099598643325
0.6539464470067157
Epoch 41/200, Loss: 0.09140317124270257
0.656825513798008
Epoch 51/200, Loss: 0.09150332301145508
0.6564165662408417
Epoch 61/200, Loss: 0.09026405632141091
0.6543119434227553
Epoch 71/200, Loss: 0.09031373909896329
0.6551365424227774
Epoch 81/200, Loss: 0.09005504278909593
0.6567728126595204
Epoch 91/200, Loss: 0.08993524233145374
0.6571338254505438
Epoch 101/200, Loss: 0.09007092547558603
0.6575277282910275
Epoch 111/200, Loss: 0.08972701731891859
0.6563632838640262
Epoch 121/200, Loss: 0.08942345308051222
0.6559361092239987
Epoch 131/200, Loss: 0.08939132777353127
0.6567408698256666
Epoch 141/200, Loss: 0.0898822761539902
0.657801258911704
Epoch 151/200, Loss: 0.09024400423680033
0.6552113281269678
Epoch 161/200, Loss: 0.0899850380207811
0.655398027527

[I 2024-01-19 15:01:02,923] Trial 12 finished with value: 0.657801258911704 and parameters: {'hidden_dim_h': 44, 'dropout': 0.2646315392063766, 'batch_size': 240}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 1.082716464996338
0.5947543832777207
Epoch 11/200, Loss: 0.5105906245963914
0.6320081014006153
Epoch 21/200, Loss: 0.2907940298318863
0.6437918940849654
Epoch 31/200, Loss: 0.21641811302730016
0.6480624793700582
Epoch 41/200, Loss: 0.1984792985022068
0.652694307521564
Epoch 51/200, Loss: 0.184555250619139
0.6505950044418508
Epoch 61/200, Loss: 0.17380711063742638
0.6517844980007627
Epoch 71/200, Loss: 0.16322444964732444
0.6519334090346107
Epoch 81/200, Loss: 0.15268492006829806
0.652889009494542
Epoch 91/200, Loss: 0.14171841687389783
0.6510313822563268
Epoch 101/200, Loss: 0.13264704602105276
0.6526768746431842
Epoch 111/200, Loss: 0.12228912301361561
0.651967284232957
Epoch 121/200, Loss: 0.11428511781351906
0.6530905705559606
Epoch 131/200, Loss: 0.10865518743438381
0.6529902648686082
Epoch 141/200, Loss: 0.10392468262995992
0.653467649680814
Epoch 151/200, Loss: 0.09796461276710033
0.6564272637484204
Epoch 161/200, Loss: 0.0956858436443976
0.6552108189654843
Epo

[I 2024-01-19 15:01:49,961] Trial 13 finished with value: 0.6576568964171344 and parameters: {'hidden_dim_h': 34, 'dropout': 0.33756016942545597, 'batch_size': 739}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.8509643492491349
0.6053644318172806
Epoch 11/200, Loss: 0.268369284444961
0.5818316741478654
Epoch 21/200, Loss: 0.1932615119477977
0.6467350753377402
Epoch 31/200, Loss: 0.1590725796810095
0.6484255716925651
Epoch 41/200, Loss: 0.1294402651812719
0.6519068731395169
Epoch 51/200, Loss: 0.10797964079656462
0.6524082737994321
Epoch 61/200, Loss: 0.09689121887735698
0.6580861314371116
Epoch 71/200, Loss: 0.09149479045384172
0.6570880694488105
Epoch 81/200, Loss: 0.08979469041029613
0.657439662372445
Epoch 91/200, Loss: 0.08946495935104895
0.654903459565741
Epoch 101/200, Loss: 0.088868691869404
0.6556916043778008
Epoch 111/200, Loss: 0.08916173076284105
0.6555081912741245
Epoch 121/200, Loss: 0.08927025214053583
0.6577824204272674
Epoch 131/200, Loss: 0.08907132822534312
0.6551927045650785
Epoch 141/200, Loss: 0.08892910085294557
0.6569729716425721
Epoch 151/200, Loss: 0.0885902555740398
0.6587164098196335
Epoch 161/200, Loss: 0.08880887774453647
0.6592109154415835
Ep

[I 2024-01-19 15:02:54,250] Trial 14 finished with value: 0.6592109154415835 and parameters: {'hidden_dim_h': 50, 'dropout': 0.1547039072013048, 'batch_size': 292}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 1.2009875059127808
0.5807649490119096
Epoch 11/200, Loss: 0.5295601325375693
0.6256154597731336
Epoch 21/200, Loss: 0.31735007337161475
0.6437630848563534
Epoch 31/200, Loss: 0.2648946336337498
0.6471433120164217
Epoch 41/200, Loss: 0.24223071634769439
0.65032182157626
Epoch 51/200, Loss: 0.22151129288332802
0.6518808653831063
Epoch 61/200, Loss: 0.20006644129753112
0.6463625108003744
Epoch 71/200, Loss: 0.17886593469551632
0.6472932199568863
Epoch 81/200, Loss: 0.15947101286479404
0.649908976918247
Epoch 91/200, Loss: 0.14194526374340058
0.6502230083220805
Epoch 101/200, Loss: 0.12735636766467776
0.6528307099821754
Epoch 111/200, Loss: 0.11516765973397664
0.6540282196292055
Epoch 121/200, Loss: 0.10598375690834863
0.6518462023268943
Epoch 131/200, Loss: 0.09960036150046757
0.6559132936802917
Epoch 141/200, Loss: 0.09570048855883735
0.654080951540558
Epoch 151/200, Loss: 0.09256545986448016
0.655313545121298
Epoch 161/200, Loss: 0.09090838836772101
0.657312276169507


[I 2024-01-19 15:03:37,432] Trial 15 finished with value: 0.6586475661273041 and parameters: {'hidden_dim_h': 14, 'dropout': 0.2888563836858838, 'batch_size': 577}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.5098662321214322
0.5962903398388973
Epoch 11/200, Loss: 0.23238389690717062
0.6516818141703584
Epoch 21/200, Loss: 0.17831437620851728
0.6525008914153166
Epoch 31/200, Loss: 0.1643286523995576
0.6506822531786286
Epoch 41/200, Loss: 0.15121184510213356
0.6532454296664982
Epoch 51/200, Loss: 0.13961590854106126
0.653062161482009
Epoch 61/200, Loss: 0.12835617777374056
0.651878534331516
Epoch 71/200, Loss: 0.11872653138858301
0.6561542186958015
Epoch 81/200, Loss: 0.11064545920601597
0.6551673839689323
Epoch 91/200, Loss: 0.10345194571548039
0.6540734373959339
Epoch 101/200, Loss: 0.09828349396034523
0.6538742792073031
Epoch 111/200, Loss: 0.09468063684525313
0.6564714136677898
Epoch 121/200, Loss: 0.09202333512129607
0.6583622079756386
Epoch 131/200, Loss: 0.09058653866803204
0.6560451601873091
Epoch 141/200, Loss: 0.08900608481080444
0.6570653117408645
Epoch 151/200, Loss: 0.0879495397762016
0.6565544485368343
Epoch 161/200, Loss: 0.0884539885101495
0.65787525142251

[I 2024-01-19 15:04:19,302] Trial 16 finished with value: 0.6583622079756386 and parameters: {'hidden_dim_h': 20, 'dropout': 0.06743002289068625, 'batch_size': 758}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.23320218155728303
0.6150759405210122
Epoch 11/200, Loss: 0.1036033455063315
0.6474247336145005
Epoch 21/200, Loss: 0.0924914398375042
0.6586415450694537
Epoch 31/200, Loss: 0.09115697317980828
0.6551746531172097
Epoch 41/200, Loss: 0.09112226572584979
0.6550624121922308
Epoch 51/200, Loss: 0.09083866122811236
0.6506376558756238
Epoch 61/200, Loss: 0.09053206135005874
0.6546911678592036
Epoch 71/200, Loss: 0.09089491193626016
0.6568599808617697
Epoch 81/200, Loss: 0.09028489909627858
0.6584011951082126
Epoch 91/200, Loss: 0.08982640769790838
0.6600809993629342
Epoch 101/200, Loss: 0.09018261806372015
0.6600555162070485
Epoch 111/200, Loss: 0.08983995982590207
0.6574094639348345
Epoch 121/200, Loss: 0.09018570943710638
0.6578995317096413
Epoch 131/200, Loss: 0.09004854209681246
0.6551834237045885
Epoch 141/200, Loss: 0.09048502675113193
0.6562992850659803
Epoch 151/200, Loss: 0.08948641142902528
0.6594221422944303
Epoch 161/200, Loss: 0.089899890782202
0.653787672484

[I 2024-01-19 15:06:01,109] Trial 17 finished with value: 0.6600809993629342 and parameters: {'hidden_dim_h': 42, 'dropout': 0.10793156743886785, 'batch_size': 107}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.4561009428983817
0.6282416676022993
Epoch 11/200, Loss: 0.16468077564349204
0.6365258919574681
Epoch 21/200, Loss: 0.10089948668253203
0.6514476329219671
Epoch 31/200, Loss: 0.09113301473892539
0.6575120560392473
Epoch 41/200, Loss: 0.09038305380867302
0.6527078923674887
Epoch 51/200, Loss: 0.09116794152950948
0.6552115191535658
Epoch 61/200, Loss: 0.0908832587758822
0.6565472426399656
Epoch 71/200, Loss: 0.09024649481374793
0.6589387754481034
Epoch 81/200, Loss: 0.08981372873110274
0.6562650856440897
Epoch 91/200, Loss: 0.08971802186380866
0.6583991553311824
Epoch 101/200, Loss: 0.09027660352412177
0.659696420677218
Epoch 111/200, Loss: 0.09005687074975734
0.6592275883636618
Epoch 121/200, Loss: 0.09005864778179333
0.6593190592568391
Epoch 131/200, Loss: 0.08988146307918192
0.658135718187133
Epoch 141/200, Loss: 0.08953762774361423
0.6582758150169127
Epoch 151/200, Loss: 0.08924492217737473
0.6573974962361175
Epoch 161/200, Loss: 0.08899345925432041
0.659948347838

[I 2024-01-19 15:07:32,744] Trial 18 finished with value: 0.6599483478388104 and parameters: {'hidden_dim_h': 43, 'dropout': 0.11050372066088474, 'batch_size': 123}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 1.9519005219141643
0.5711182799920068
Epoch 11/200, Loss: 0.24888674594381804
0.6379094103939604
Epoch 21/200, Loss: 0.13584718292438855
0.6560547903386487
Epoch 31/200, Loss: 0.12328039149763764
0.6524793089033984
Epoch 41/200, Loss: 0.10981410894022194
0.6508113460094685
Epoch 51/200, Loss: 0.09910089650782206
0.6519217343018353
Epoch 61/200, Loss: 0.09251062107342546
0.6558563929889408
Epoch 71/200, Loss: 0.09047576945315125
0.6527507269122049
Epoch 81/200, Loss: 0.08960947282211755
0.6578579065615503
Epoch 91/200, Loss: 0.0892747821666861
0.6540124714915235
Epoch 101/200, Loss: 0.0893684536298757
0.6580311044253441
Epoch 111/200, Loss: 0.08930877548071646
0.6573846588256893
Epoch 121/200, Loss: 0.08909506102403005
0.6575698496936714
Epoch 131/200, Loss: 0.08896410056660252
0.6560164669107832
Epoch 141/200, Loss: 0.08905396105781678
0.6569301369591072
Epoch 151/200, Loss: 0.08909344825372902
0.6573136613736825
Epoch 161/200, Loss: 0.08939947973015488
0.65704553725

[I 2024-01-19 15:08:34,937] Trial 19 finished with value: 0.658836528862436 and parameters: {'hidden_dim_h': 32, 'dropout': 0.1592116218312928, 'batch_size': 216}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.22867297232151032
0.6071323141361301
Epoch 11/200, Loss: 0.18138809323310853
0.6466579366597188
Epoch 21/200, Loss: 0.15335877656936645
0.6512548284228706
Epoch 31/200, Loss: 0.1319212058186531
0.6542263960338054
Epoch 41/200, Loss: 0.11725990951061249
0.6532864246596304
Epoch 51/200, Loss: 0.1063472232222557
0.6564315230882849
Epoch 61/200, Loss: 0.0988594737648964
0.6478322231576021
Epoch 71/200, Loss: 0.09441527307033538
0.6576005001495867
Epoch 81/200, Loss: 0.09189257591962814
0.6548992488029404
Epoch 91/200, Loss: 0.09001614034175873
0.6576772060036588
Epoch 101/200, Loss: 0.08913122117519379
0.6547880552607636
Epoch 111/200, Loss: 0.08881245344877244
0.6576116348672556
Epoch 121/200, Loss: 0.0881348466873169
0.6578001741530415
Epoch 131/200, Loss: 0.08845301777124405
0.6562775402767652
Epoch 141/200, Loss: 0.08791094839572906
0.6585030305556588
Epoch 151/200, Loss: 0.0881421485543251
0.656363365090823
Epoch 161/200, Loss: 0.08763903081417083
0.65846073909452

[I 2024-01-19 15:09:24,619] Trial 20 finished with value: 0.658600458608129 and parameters: {'hidden_dim_h': 41, 'dropout': 0.1065713338067436, 'batch_size': 822}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.16765324241023952
0.6140027547008617
Epoch 11/200, Loss: 0.11262184684559451
0.6516274969041458
Epoch 21/200, Loss: 0.09678241206427753
0.6541806306549975
Epoch 31/200, Loss: 0.0919335667612189
0.6575951132275576
Epoch 41/200, Loss: 0.09057613399069188
0.6535754670368971
Epoch 51/200, Loss: 0.08995932037547483
0.6553598750976543
Epoch 61/200, Loss: 0.0901401694548332
0.6561873474646761
Epoch 71/200, Loss: 0.08954895414033179
0.6579049340777683
Epoch 81/200, Loss: 0.0898627044033196
0.6569814324881802
Epoch 91/200, Loss: 0.08961735855219728
0.6585999573810197
Epoch 101/200, Loss: 0.08968698233366013
0.6568910790215335
Epoch 111/200, Loss: 0.08953772851471174
0.6598842434356363
Epoch 121/200, Loss: 0.08932653511479749
0.6577076981307753
Epoch 131/200, Loss: 0.08951099141169402
0.6552418948620291
Epoch 141/200, Loss: 0.08914481330726107
0.6579089777003375
Epoch 151/200, Loss: 0.08977296241259171
0.6580284677564424
Epoch 161/200, Loss: 0.089401728015835
0.6579965928138

[I 2024-01-19 15:10:20,308] Trial 21 finished with value: 0.6598842434356363 and parameters: {'hidden_dim_h': 38, 'dropout': 0.23645378875063422, 'batch_size': 342}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 1.1439063574405426
0.5931687329980786
Epoch 11/200, Loss: 0.30865051613209094
0.6381318130552449
Epoch 21/200, Loss: 0.13520282237453662
0.6479116042814086
Epoch 31/200, Loss: 0.11675042738305762
0.650008724872227
Epoch 41/200, Loss: 0.11147779067780109
0.6547814830006625
Epoch 51/200, Loss: 0.1069571187204503
0.655795095697316
Epoch 61/200, Loss: 0.10238220193918715
0.653656878738725
Epoch 71/200, Loss: 0.09880780175011208
0.6549223566856033
Epoch 81/200, Loss: 0.09567656399721795
0.651805582674927
Epoch 91/200, Loss: 0.0927772988030251
0.6578247768834011
Epoch 101/200, Loss: 0.09087883902991072
0.6557225377332714
Epoch 111/200, Loss: 0.08967249602713484
0.656248612022971
Epoch 121/200, Loss: 0.08943344066117673
0.6582174704151519
Epoch 131/200, Loss: 0.08908005550186684
0.6595330758109093
Epoch 141/200, Loss: 0.08914169082616238
0.6593068448889395
Epoch 151/200, Loss: 0.0894785298311964
0.6582644124941683
Epoch 161/200, Loss: 0.08910382634147684
0.6574222642718944


[I 2024-01-19 15:11:14,003] Trial 22 finished with value: 0.6595330758109093 and parameters: {'hidden_dim_h': 45, 'dropout': 0.18435700694732265, 'batch_size': 432}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 1.4348699348655778
0.5912268781784518
Epoch 11/200, Loss: 0.14589167472405648
0.6508252184638442
Epoch 21/200, Loss: 0.11000734050968784
0.6485500437958889
Epoch 31/200, Loss: 0.09418997067452675
0.6503981792827854
Epoch 41/200, Loss: 0.09257899039429636
0.6550719847852505


[I 2024-01-19 15:11:36,355] Trial 23 finished with value: 0.6550719847852505 and parameters: {'hidden_dim_h': 31, 'dropout': 0.05171985648855343, 'batch_size': 101}. Best is trial 7 with value: 0.6602838188368743.


training failed
Epoch 1/200, Loss: 0.24366753101348876
0.6103569111365028
Epoch 11/200, Loss: 0.17674998428140368
0.6418820100744049
Epoch 21/200, Loss: 0.1386731545839991
0.6464692525876687
Epoch 31/200, Loss: 0.12180998112474169
0.6483812415885339
Epoch 41/200, Loss: 0.10985189186675208
0.6518686148838597
Epoch 51/200, Loss: 0.10107479180608477
0.6516729983820464
Epoch 61/200, Loss: 0.10054440328053066
0.6501699876341837


[I 2024-01-19 15:11:53,760] Trial 24 finished with value: 0.6548423161767126 and parameters: {'hidden_dim_h': 37, 'dropout': 0.1340703386398826, 'batch_size': 588}. Best is trial 7 with value: 0.6602838188368743.


Epoch 71/200, Loss: 0.09378707408905029
0.6548423161767126
training failed


[I 2024-01-19 15:11:54,267] Trial 25 finished with value: 0.6186758862462375 and parameters: {'hidden_dim_h': 42, 'dropout': 0.256697055494429, 'batch_size': 248}. Best is trial 7 with value: 0.6602838188368743.


Epoch 1/200, Loss: 0.38913113209936356
0.6186758862462375
training failed


[W 2024-01-19 15:11:54,363] Trial 26 failed with parameters: {'hidden_dim_h': 50, 'dropout': 0.31019864812263087, 'batch_size': 518} because of the following error: ValueError('zero-size array to reduction operation maximum which has no identity').
Traceback (most recent call last):
  File "/home/juannanzhou/.local/lib/python3.10/site-packages/optuna/study/_optimize.py", line 200, in _run_trial
    value_or_values = func(trial)
  File "/scratch/local/21743416/ipykernel_2182428/3287748320.py", line 55, in objective
    return np.array(r2_test).max()
  File "/apps/pytorch/2.0.1/lib/python3.10/site-packages/numpy/core/_methods.py", line 41, in _amax
    return umr_maximum(a, axis, None, out, keepdims, initial, where)
ValueError: zero-size array to reduction operation maximum which has no identity
[W 2024-01-19 15:11:54,375] Trial 26 failed with value None.


training failed



KeyboardInterrupt



#### 4 layer no softmax

In [128]:
import optuna
from scipy.stats import pearsonr
learning_rate = 0.001
epochs = 200
num_heads = 4
num_layers = 3
sequence_length = L
input_dim = AA_size*L
output_dim = 1
dropout_init = 0.3
batch_size_init = 1000
hidden_dim_h_init = 32

def objective(trial):
    # Define the hyperparameters to be optimized
    # hidden_dim_h = trial.suggest_int('hidden_dim_h', hidden_dim_h_init, 10, 50)
    # dropout = trial.suggest_float('dropout', dropout_init, 0.05, 0.35)
    # batch_size = trial.suggest_int('batch_size', batch_size_init, 100, 1200)

    hidden_dim_h = trial.suggest_int('hidden_dim_h', 10, 50)
    dropout = trial.suggest_float('dropout', 0.05, 0.35)
    batch_size = trial.suggest_int('batch_size', 100, 1200)
    
    model = Transformer_torch_MHA(input_dim, hidden_dim_h*num_heads, num_layers, num_heads, dropout).to(device)
    
    train_loader = data.DataLoader(train_dataset,
                                   batch_size=batch_size,
                                   shuffle=True,
                                   drop_last=False)
    criterion = nn.MSELoss()
    optimizer = optim.Adam(model.parameters(), lr=learning_rate)

    r2_test = []
    try: 
        for epoch in range(epochs):

                model.train()
                total_loss = 0
                for batch_inputs, batch_targets in train_loader:
                    optimizer.zero_grad()
                    outputs = model(batch_inputs)
                    loss = criterion(outputs, batch_targets)
                    loss.backward()
                    optimizer.step()
                    total_loss += loss.item()

                if epoch % 10 == 0:
                    print(f"Epoch {epoch+1}/{epochs}, Loss: {total_loss/len(train_loader)}")
                    model.eval()
                    pred, true = model(X_test.flatten(1)).flatten().detach().cpu().numpy(), y_test.flatten().detach().cpu().numpy()
                    print(pearsonr(pred, true)[0]**2)
                    r2_test.append(pearsonr(pred, true)[0]**2)
    except: print("training failed")
            
    return np.array(r2_test).max()

In [129]:
# Create and run the Optuna study
study = optuna.create_study(direction='maximize')
study.optimize(objective, n_trials=100)

# Print the best hyperparameters
best_trial = study.best_trial
print("Best Trial:")
print(f"  Value: {best_trial.value:.4f}")
print("  Params: ")
for key, value in best_trial.params.items():
    print(f"    {key}: {value}")

# You can then use the best hyperparameters to train your final model.


[I 2024-01-19 15:12:14,436] A new study created in memory with name: no-name-9c22fc75-c37f-4d92-a0a5-18159ba37298


Epoch 1/200, Loss: 1.5696055261712325
0.5529456622092959
Epoch 11/200, Loss: 0.9873613966138739
0.6208771518192044
Epoch 21/200, Loss: 0.6063449069073326
0.680805688006576
Epoch 31/200, Loss: 0.3713805173572741
0.6989521277159215
Epoch 41/200, Loss: 0.23734470025489204
0.7161684704002198
Epoch 51/200, Loss: 0.16706325819617823
0.7261282661095085
Epoch 61/200, Loss: 0.13284645543286674
0.7208771470468569
Epoch 71/200, Loss: 0.11705594274558519
0.7258383438930762
Epoch 81/200, Loss: 0.10865764986527593
0.7361305773727241
Epoch 91/200, Loss: 0.10254632799248946
0.7330679652102572
Epoch 101/200, Loss: 0.09739686862418526
0.7342193345674372
Epoch 111/200, Loss: 0.09270954641856645
0.7342960008713733
Epoch 121/200, Loss: 0.08720919529074117
0.7321630086391003
Epoch 131/200, Loss: 0.08160967183740515
0.7285754923175938
Epoch 141/200, Loss: 0.07649717636798557
0.733803695173195
Epoch 151/200, Loss: 0.07159466021939327
0.740971019882085
Epoch 161/200, Loss: 0.06661461881901089
0.737974389813457

[I 2024-01-19 15:13:25,875] Trial 0 finished with value: 0.740971019882085 and parameters: {'hidden_dim_h': 25, 'dropout': 0.1534283823499647, 'batch_size': 1077}. Best is trial 0 with value: 0.740971019882085.


Epoch 1/200, Loss: 0.5248821409125077
0.5624418158578562
Epoch 11/200, Loss: 0.34346618150409897
0.6755111385848306
Epoch 21/200, Loss: 0.2604379238266694
0.6116766425039013
Epoch 31/200, Loss: 0.21589773422793337
0.66120080724652
Epoch 41/200, Loss: 0.19785664975643158
0.6931692441134631
Epoch 51/200, Loss: 0.18230046567163968
0.7064577844167955
Epoch 61/200, Loss: 0.1661776453256607
0.719849307107028
Epoch 71/200, Loss: 0.14922057013762624
0.717860345261256
Epoch 81/200, Loss: 0.1335467162885164
0.7242243736839141
Epoch 91/200, Loss: 0.11853236156074624
0.7243316522106902
Epoch 101/200, Loss: 0.104018329789764
0.7172313451399127
Epoch 111/200, Loss: 0.09157252194065797
0.7296722066755272
Epoch 121/200, Loss: 0.0794878845152102
0.7245262934006577
Epoch 131/200, Loss: 0.07011298207860243
0.7274455312582387
Epoch 141/200, Loss: 0.060245658418065624
0.7206732658961307
Epoch 151/200, Loss: 0.052374470978975296
0.722711601456737
Epoch 161/200, Loss: 0.059015750885009766
nan




Epoch 171/200, Loss: 0.26055755191727686
nan
Epoch 181/200, Loss: 0.26063311727423416
nan
Epoch 191/200, Loss: 0.2603272866261633
nan


[W 2024-01-19 15:14:37,409] Trial 1 failed with parameters: {'hidden_dim_h': 26, 'dropout': 0.2940587359822982, 'batch_size': 1077} because of the following error: The value nan is not acceptable.
[W 2024-01-19 15:14:37,410] Trial 1 failed with value nan.


Epoch 1/200, Loss: 0.19646501237595523
0.615430393880217
Epoch 11/200, Loss: 0.1209236623512374
0.7015679781752171
Epoch 21/200, Loss: 0.08004889126729083
0.7229956264879851
Epoch 31/200, Loss: 0.055300317221769583
0.7188110483348606
Epoch 41/200, Loss: 0.043111232557782424
0.7185245105625623
Epoch 51/200, Loss: 0.03707526148193412
0.7157374594847548
Epoch 61/200, Loss: 0.03306338418689039
0.7105250665748999
Epoch 71/200, Loss: 0.02973816443786577
0.715038878548661
Epoch 81/200, Loss: 0.02867266853098516
0.7130370693623215
Epoch 91/200, Loss: 0.026931720544342643
0.7122625639023873
Epoch 101/200, Loss: 0.025226954163776502
0.7227081575738042
Epoch 111/200, Loss: 0.024321169937374414
0.7100117478613768
Epoch 121/200, Loss: 0.024166975722268776
0.7135647518178194
Epoch 131/200, Loss: 0.023289341169099014
0.7146286447632135
Epoch 141/200, Loss: 0.022612110780621017
0.7146085240547525
Epoch 151/200, Loss: 0.021903816576081293
0.715176249435508
Epoch 161/200, Loss: 0.021051169304108178
0.71

[I 2024-01-19 15:15:54,601] Trial 2 finished with value: 0.7229956264879851 and parameters: {'hidden_dim_h': 18, 'dropout': 0.0760497865075247, 'batch_size': 375}. Best is trial 0 with value: 0.740971019882085.


Epoch 1/200, Loss: 2.4090633619399298
0.5073264841626564
Epoch 11/200, Loss: 1.5969399951753163
0.5709620335790593
Epoch 21/200, Loss: 1.059831128233955
0.6271508574794442
Epoch 31/200, Loss: 0.7108023422104972
0.6630352145173455
Epoch 41/200, Loss: 0.4969316493897211
0.6960208595481162
Epoch 51/200, Loss: 0.3772945347286406
0.7066787567710844
Epoch 61/200, Loss: 0.3140912481716701
0.7157486937117161
Epoch 71/200, Loss: 0.28176907840229215
0.7179666903659838
Epoch 81/200, Loss: 0.26165815194447833
0.7157420226470899
Epoch 91/200, Loss: 0.24752986431121826
0.7125699314936672
Epoch 101/200, Loss: 0.23426663875579834
0.7091589335408599
Epoch 111/200, Loss: 0.2215866290387653
0.7139989956174376
Epoch 121/200, Loss: 0.20833479932376317
0.703113770358829
Epoch 131/200, Loss: 0.19493646706853593
0.7153008913079908
Epoch 141/200, Loss: 0.1801182883126395
0.7039733138124982
Epoch 151/200, Loss: 0.16574224262010484
0.7195378469408501
Epoch 161/200, Loss: 0.15048898472672417
0.7307285722077838
Ep

[W 2024-01-19 15:17:27,081] Trial 3 failed with parameters: {'hidden_dim_h': 44, 'dropout': 0.31723261993464696, 'batch_size': 973} because of the following error: The value nan is not acceptable.
[W 2024-01-19 15:17:27,082] Trial 3 failed with value nan.


Epoch 1/200, Loss: 1.0518915627151728
0.4992992653721001
Epoch 11/200, Loss: 0.2606563469395041
nan
Epoch 21/200, Loss: 0.2606135096400976
nan
Epoch 31/200, Loss: 0.260625892970711
nan
Epoch 41/200, Loss: 0.2606267591007054
nan
Epoch 51/200, Loss: 0.2606043360196054
nan
Epoch 61/200, Loss: 0.2606547435745597
nan
Epoch 71/200, Loss: 0.2606216410174966
nan
Epoch 81/200, Loss: 0.2606831622309983
nan
Epoch 91/200, Loss: 0.2606260610744357
nan
Epoch 101/200, Loss: 0.26059951037168505
nan
Epoch 111/200, Loss: 0.26066343300044537
nan
Epoch 121/200, Loss: 0.2606300665996969
nan
Epoch 131/200, Loss: 0.2606337320059538
nan
Epoch 141/200, Loss: 0.2606751530431211
nan
Epoch 151/200, Loss: 0.26063533704727887
nan
Epoch 161/200, Loss: 0.2606353203766048
nan
Epoch 171/200, Loss: 0.26063744686543944
nan
Epoch 181/200, Loss: 0.26061933478340504
nan
Epoch 191/200, Loss: 0.26064055114984513
nan


[W 2024-01-19 15:19:57,598] Trial 4 failed with parameters: {'hidden_dim_h': 39, 'dropout': 0.3433189469712564, 'batch_size': 125} because of the following error: The value nan is not acceptable.
[W 2024-01-19 15:19:57,598] Trial 4 failed with value nan.


Epoch 1/200, Loss: 0.19823337718844414
0.6245690346259052
Epoch 11/200, Loss: 0.13028572276234626
0.7140000924124569
Epoch 21/200, Loss: 0.0994539674371481
0.7256240999870904
Epoch 31/200, Loss: 0.07586099170148372
0.7273324719495594
Epoch 41/200, Loss: 0.05796891935169697
0.738091233871869
Epoch 51/200, Loss: 0.044946618191897866
0.7347259655667876
Epoch 61/200, Loss: 0.034769092500209806
0.7440496299641192
Epoch 71/200, Loss: 0.02888080133125186
0.7368320307246143
Epoch 81/200, Loss: 0.023822276201099158
0.7376722484400575
Epoch 91/200, Loss: 0.020614979695528744
0.7366066547941158
Epoch 101/200, Loss: 0.018425377551466227
0.7368903038400977
Epoch 111/200, Loss: 0.016629743063822387
0.7345015768555794
Epoch 121/200, Loss: 0.015385225135833024
0.7301807406058818
Epoch 131/200, Loss: 0.01448742845095694
0.7309724493156232
Epoch 141/200, Loss: 0.0644594038836658
nan
Epoch 151/200, Loss: 0.2606032632291317
nan
Epoch 161/200, Loss: 0.2606432497501373
nan
Epoch 171/200, Loss: 0.26051423400

[W 2024-01-19 15:21:37,901] Trial 5 failed with parameters: {'hidden_dim_h': 50, 'dropout': 0.11557529084384438, 'batch_size': 1023} because of the following error: The value nan is not acceptable.
[W 2024-01-19 15:21:37,902] Trial 5 failed with value nan.


Epoch 1/200, Loss: 0.25173365344872345
0.5636778326724242
Epoch 11/200, Loss: 0.16893755382782705
0.6653804510126535
Epoch 21/200, Loss: 0.12314291177569209
0.6963962550071602
Epoch 31/200, Loss: 0.09358971102817638
0.7033557883525988
Epoch 41/200, Loss: 0.07525038900407585
0.7136615657548191
Epoch 51/200, Loss: 0.06291650517566784
0.7060150971457976
Epoch 61/200, Loss: 0.05669744876590935
0.7081823005884073
Epoch 71/200, Loss: 0.052445453566473885
0.7082303217390563
Epoch 81/200, Loss: 0.04931320441333023
0.7148943491938001
Epoch 91/200, Loss: 0.04712971672415733
0.7131017455774279
Epoch 101/200, Loss: 0.04523243473188297
0.7122696163440702
Epoch 111/200, Loss: 0.044706951625443796
0.7110544894357633
Epoch 121/200, Loss: 0.04315048808584342
0.7173654211792779
Epoch 131/200, Loss: 0.042560471070779336
0.7209062829431004
Epoch 141/200, Loss: 0.041194527737192205
0.7210487019840379
Epoch 151/200, Loss: 0.03987667296786566
0.7150127060061205
Epoch 161/200, Loss: 0.03942309460929922
0.7234

[I 2024-01-19 15:22:43,302] Trial 6 finished with value: 0.7234760472918605 and parameters: {'hidden_dim_h': 10, 'dropout': 0.10824945232454569, 'batch_size': 552}. Best is trial 0 with value: 0.740971019882085.


Epoch 1/200, Loss: 1.4166237732459759
0.5666880405289686
Epoch 11/200, Loss: 0.6772848984290814
0.639857887979002
Epoch 21/200, Loss: 0.3235513660414466
0.6899496858900409
Epoch 31/200, Loss: 0.18448661730207247
0.7114220791972296
Epoch 41/200, Loss: 0.13941154295000538
0.7230527795795961
Epoch 51/200, Loss: 0.12422495874865301
0.7237871015968154
Epoch 61/200, Loss: 0.11512771942492189
0.7186699287037076
Epoch 71/200, Loss: 0.10646749801676848
0.7198008148222647
Epoch 81/200, Loss: 0.09806363079054602
0.7238063497438649
Epoch 91/200, Loss: 0.08934887755533745
0.7203883762039945
Epoch 101/200, Loss: 0.08079567988371027
0.7285156635694311
Epoch 111/200, Loss: 0.07222608489723041
0.7153868107512863
Epoch 121/200, Loss: 0.06397068423443827
0.7186646184959743
Epoch 131/200, Loss: 0.05710211319142375
0.7246909599386334
Epoch 141/200, Loss: 0.05061476382202115
0.7142171592481836
Epoch 151/200, Loss: 0.044848840041407226
0.7189941021140315
Epoch 161/200, Loss: 0.04013531115548364
0.72089294809

[I 2024-01-19 15:23:46,769] Trial 7 finished with value: 0.7285156635694311 and parameters: {'hidden_dim_h': 14, 'dropout': 0.10173738014052287, 'batch_size': 690}. Best is trial 0 with value: 0.740971019882085.


Epoch 1/200, Loss: 0.3359292480680678
0.6151551041214511
Epoch 11/200, Loss: 0.267438648475541
0.7034842186942575
Epoch 21/200, Loss: 0.22985722124576569
0.721470873790889
Epoch 31/200, Loss: 0.19403106222550073
0.7126303609043212
Epoch 41/200, Loss: 0.16109807044267654
0.737671017633143
Epoch 51/200, Loss: 0.13250607293513086
0.7418196213268704
Epoch 61/200, Loss: 0.10826222267415789
0.7390979477275891
Epoch 71/200, Loss: 0.08802246509326829
0.7325726180151825
Epoch 81/200, Loss: 0.07146487509210904
0.7356839779275746
Epoch 91/200, Loss: 0.05790581843919224
0.7351299080786765
Epoch 101/200, Loss: 0.26087242033746505
nan
Epoch 111/200, Loss: 0.26065556704998016
nan
Epoch 121/200, Loss: 0.260530701941914
nan
Epoch 131/200, Loss: 0.2607640003164609
nan
Epoch 141/200, Loss: 0.26029541591803235
nan
Epoch 151/200, Loss: 0.26047004345390534
nan
Epoch 161/200, Loss: 0.26050544364584816
nan
Epoch 171/200, Loss: 0.2607141584157944
nan
Epoch 181/200, Loss: 0.26059000939130783
nan
Epoch 191/200, 

[W 2024-01-19 15:25:15,628] Trial 8 failed with parameters: {'hidden_dim_h': 42, 'dropout': 0.13911569544161834, 'batch_size': 1131} because of the following error: The value nan is not acceptable.
[W 2024-01-19 15:25:15,628] Trial 8 failed with value nan.


Epoch 1/200, Loss: 0.21717839719543994
0.6148452592207653
Epoch 11/200, Loss: 0.12297733233008586
0.685181748407459
Epoch 21/200, Loss: 0.08125209462055018
0.7074811077031085
Epoch 31/200, Loss: 0.26053477991634694
nan
Epoch 41/200, Loss: 0.2606057134312643
nan
Epoch 51/200, Loss: 0.26086936534290583
nan
Epoch 61/200, Loss: 0.2601859907449131
nan
Epoch 71/200, Loss: 0.26067582906132014
nan
Epoch 81/200, Loss: 0.26059831406029177
nan
Epoch 91/200, Loss: 0.2606634648752884
nan
Epoch 101/200, Loss: 0.2604732393798694
nan
Epoch 111/200, Loss: 0.2608479399916152
nan
Epoch 121/200, Loss: 0.2610151385757285
nan
Epoch 131/200, Loss: 0.260441231685625
nan
Epoch 141/200, Loss: 0.2604307385397629
nan
Epoch 151/200, Loss: 0.26060593065241694
nan
Epoch 161/200, Loss: 0.2608530431146353
nan
Epoch 171/200, Loss: 0.26039427539832155
nan
Epoch 181/200, Loss: 0.2604962969329995
nan
Epoch 191/200, Loss: 0.26048136156209756
nan


[W 2024-01-19 15:26:57,188] Trial 9 failed with parameters: {'hidden_dim_h': 33, 'dropout': 0.13050350425271906, 'batch_size': 284} because of the following error: The value nan is not acceptable.
[W 2024-01-19 15:26:57,189] Trial 9 failed with value nan.


Epoch 1/200, Loss: 0.7188826951574772
0.5925285343340994
Epoch 11/200, Loss: 0.289485421269498
0.7097624074308125
Epoch 21/200, Loss: 0.2304124134652158
0.7162526952622926
Epoch 31/200, Loss: 0.18608099856275193
0.725840200750247
Epoch 41/200, Loss: 0.14162158633166172
0.7170864110261099
Epoch 51/200, Loss: 0.10171088354384646
0.7365221332545772
Epoch 61/200, Loss: 0.07020863692494149
0.7357459191097603
Epoch 71/200, Loss: 0.04859311632970546
0.7275669252795415
Epoch 81/200, Loss: 0.03358873697195915
0.7347210361130287
Epoch 91/200, Loss: 0.024983339883545612
0.7257506293137753
Epoch 101/200, Loss: 0.020068890276424427
0.7302005222299006
Epoch 111/200, Loss: 0.01754085111253439
0.7225548328561344
Epoch 121/200, Loss: 0.04763581958460681
nan
Epoch 131/200, Loss: 0.2603533442350144
nan
Epoch 141/200, Loss: 0.2610752202094869
nan
Epoch 151/200, Loss: 0.26037002656053987
nan
Epoch 161/200, Loss: 0.2610004296962251
nan
Epoch 171/200, Loss: 0.26115348079103107
nan
Epoch 181/200, Loss: 0.2607

[W 2024-01-19 15:28:17,415] Trial 10 failed with parameters: {'hidden_dim_h': 25, 'dropout': 0.050221968675879095, 'batch_size': 432} because of the following error: The value nan is not acceptable.
[W 2024-01-19 15:28:17,416] Trial 10 failed with value nan.


Epoch 1/200, Loss: 0.6715015983581543
0.6115021833556807
Epoch 11/200, Loss: 0.30095691442489625
0.7056127117981499
Epoch 21/200, Loss: 0.175057989358902
0.7176433140504613
Epoch 31/200, Loss: 0.13938152611255647
0.7192536134482647


[I 2024-01-19 15:28:32,544] Trial 11 finished with value: 0.7192536134482647 and parameters: {'hidden_dim_h': 32, 'dropout': 0.05915782485824798, 'batch_size': 819}. Best is trial 0 with value: 0.740971019882085.


training failed
Epoch 1/200, Loss: 0.8492783451902455
0.5291646201454576


[I 2024-01-19 15:28:34,588] Trial 12 finished with value: 0.5291646201454576 and parameters: {'hidden_dim_h': 11, 'dropout': 0.1443183799513162, 'batch_size': 345}. Best is trial 0 with value: 0.740971019882085.
[W 2024-01-19 15:28:34,763] Trial 13 failed with parameters: {'hidden_dim_h': 42, 'dropout': 0.2310983019479136, 'batch_size': 948} because of the following error: ValueError('zero-size array to reduction operation maximum which has no identity').
Traceback (most recent call last):
  File "/home/juannanzhou/.local/lib/python3.10/site-packages/optuna/study/_optimize.py", line 200, in _run_trial
    value_or_values = func(trial)
  File "/scratch/local/21743416/ipykernel_2182428/1232726190.py", line 55, in objective
    return np.array(r2_test).max()
  File "/apps/pytorch/2.0.1/lib/python3.10/site-packages/numpy/core/_methods.py", line 41, in _amax
    return umr_maximum(a, axis, None, out, keepdims, initial, where)
ValueError: zero-size array to reduction operation maximum which 

training failed
training failed


ValueError: zero-size array to reduction operation maximum which has no identity

In [130]:
w = torch.rand(100, 10, 10)

In [139]:
w = torch.softmax(w, 0)

In [140]:
w.sum()

tensor(100.)

In [None]:
def softmax(input: Tensor, dim: Optional[int] = None, _stacklevel: int = 3, dtype: Optional[DType] = None) -> Tensor:
    r"""Applies a softmax function.

    Softmax is defined as:

    :math:`\text{Softmax}(x_{i}) = \frac{\exp(x_i)}{\sum_j \exp(x_j)}`

    It is applied to all slices along dim, and will re-scale them so that the elements
    lie in the range `[0, 1]` and sum to 1.

    See :class:`~torch.nn.Softmax` for more details.

    Args:
        input (Tensor): input
        dim (int): A dimension along which softmax will be computed.
        dtype (:class:`torch.dtype`, optional): the desired data type of returned tensor.
          If specified, the input tensor is casted to :attr:`dtype` before the operation
          is performed. This is useful for preventing data type overflows. Default: None.

    .. note::
        This function doesn't work directly with NLLLoss,
        which expects the Log to be computed between the Softmax and itself.
        Use log_softmax instead (it's faster and has better numerical properties).

    """
    if has_torch_function_unary(input):
        return handle_torch_function(softmax, (input,), input, dim=dim, _stacklevel=_stacklevel, dtype=dtype)
    if dim is None:
        dim = _get_softmax_dim("softmax", input.dim(), _stacklevel)
    if dtype is None:
        ret = input.softmax(dim)
    else:
        ret = input.softmax(dim, dtype=dtype)
    return ret


### 2 layers modified softmax

In [162]:
import optuna
from scipy.stats import pearsonr
learning_rate = 0.001
epochs = 200
num_heads = 4
num_layers = 2
sequence_length = L
input_dim = AA_size*L
output_dim = 1
dropout_init = 0.3
batch_size_init = 1000
hidden_dim_h_init = 32

def objective(trial):
    # Define the hyperparameters to be optimized
    # hidden_dim_h = trial.suggest_int('hidden_dim_h', hidden_dim_h_init, 10, 50)
    # dropout = trial.suggest_float('dropout', dropout_init, 0.05, 0.35)
    # batch_size = trial.suggest_int('batch_size', batch_size_init, 100, 1200)

    hidden_dim_h = trial.suggest_int('hidden_dim_h', 10, 50)
    dropout = trial.suggest_float('dropout', 0.05, 0.35)
    batch_size = trial.suggest_int('batch_size', 100, 1200)
    
    model = Transformer_torch_MHA(input_dim, hidden_dim_h*num_heads, num_layers, num_heads, dropout).to(device)
    
    train_loader = data.DataLoader(train_dataset,
                                   batch_size=batch_size,
                                   shuffle=True,
                                   drop_last=False)
    criterion = nn.MSELoss()
    optimizer = optim.Adam(model.parameters(), lr=learning_rate)

    r2_test = []
    try: 
        for epoch in range(epochs):

                model.train()
                total_loss = 0
                for batch_inputs, batch_targets in train_loader:
                    optimizer.zero_grad()
                    outputs = model(batch_inputs)
                    loss = criterion(outputs, batch_targets)
                    loss.backward()
                    optimizer.step()
                    total_loss += loss.item()

                if epoch % 10 == 0:
                    print(f"Epoch {epoch+1}/{epochs}, Loss: {total_loss/len(train_loader)}")
                    model.eval()
                    pred, true = model(X_test.flatten(1)).flatten().detach().cpu().numpy(), y_test.flatten().detach().cpu().numpy()
                    print(pearsonr(pred, true)[0]**2)
                    if pearsonr(pred, true)[0]**2 == "nan":
                        break
                    r2_test.append(pearsonr(pred, true)[0]**2)
                    
    except: print("training failed")
            
    return np.array(r2_test).max()

In [163]:
# Create and run the Optuna study
study = optuna.create_study(direction='maximize')
study.optimize(objective, n_trials=100)

# Print the best hyperparameters
best_trial = study.best_trial
print("Best Trial:")
print(f"  Value: {best_trial.value:.4f}")
print("  Params: ")
for key, value in best_trial.params.items():
    print(f"    {key}: {value}")

# You can then use the best hyperparameters to train your final model.


[I 2024-01-21 07:52:43,020] A new study created in memory with name: no-name-3094af1d-4733-4943-a660-30b1af30aaa1


Epoch 1/200, Loss: 0.741008934047487
0.5799706222931238
Epoch 11/200, Loss: 0.4745582557386822
0.6209996219922811
Epoch 21/200, Loss: 0.3358950747383965
0.019663381102147034
Epoch 31/200, Loss: 0.27558664480845135
0.024715100806410917
Epoch 41/200, Loss: 0.25908704350392026
0.04270048100175921
Epoch 51/200, Loss: 0.25776147180133396
0.05828036624597039
Epoch 61/200, Loss: 0.2565258964896202
0.051009016541516544
Epoch 71/200, Loss: 0.2578274740113152
0.02268331969275753
Epoch 81/200, Loss: 0.25691848662164474
0.027507621120933405
Epoch 91/200, Loss: 0.2566315333048503
0.0624154162493383
Epoch 101/200, Loss: 0.25770995186434853
0.04137243499929398
Epoch 111/200, Loss: 0.2581830422083537
0.040451395959387564
Epoch 121/200, Loss: 0.2579670457376374
0.04571446986688595
Epoch 131/200, Loss: 0.2564760380321079
0.06590353845145859
Epoch 141/200, Loss: 0.25675996558533776
0.04924042830068256
Epoch 151/200, Loss: 0.255427237186167
0.0587953031915718
Epoch 161/200, Loss: 0.2554900373021762
0.0586

[I 2024-01-21 07:53:50,283] Trial 0 finished with value: 0.6209996219922811 and parameters: {'hidden_dim_h': 37, 'dropout': 0.09373644679581783, 'batch_size': 1138}. Best is trial 0 with value: 0.6209996219922811.


Epoch 1/200, Loss: 1.2905769073046172
0.5098594408104166
Epoch 11/200, Loss: 0.44105472472997814
0.5883436265118853
Epoch 21/200, Loss: 0.1652548366632217
0.6558475716147668
Epoch 31/200, Loss: 0.1068401798988
0.6639088015943411
Epoch 41/200, Loss: 0.09608879475257336
0.6767865995299699
Epoch 51/200, Loss: 0.09192634564943802
0.6830979722405155
Epoch 61/200, Loss: 0.08733882583104648
0.6885499110166958
Epoch 71/200, Loss: 0.26674870115060073
0.002091045820084161
Epoch 81/200, Loss: 0.26161317832959
0.000524525969706192
Epoch 91/200, Loss: 0.26401450083805966
0.02280615407935569
Epoch 101/200, Loss: 0.2624458724107498
0.008925806068360785
Epoch 111/200, Loss: 0.262218992297466
0.01840978159979542
Epoch 121/200, Loss: 0.2594477373820085
0.025422055966088857
Epoch 131/200, Loss: 0.25948197146256763
0.022966233423800976
Epoch 141/200, Loss: 0.2598698039849599
0.022532756246076324
Epoch 151/200, Loss: 0.2589315458750113
0.02497221124125527
Epoch 161/200, Loss: 0.25853944283265334
0.02924797

[I 2024-01-21 07:55:08,103] Trial 1 finished with value: 0.6885499110166958 and parameters: {'hidden_dim_h': 44, 'dropout': 0.25300407113702317, 'batch_size': 517}. Best is trial 1 with value: 0.6885499110166958.


Epoch 1/200, Loss: 0.2512191430880473
0.5542194471451242
Epoch 11/200, Loss: 0.20850110684449857
0.6197719966699271
Epoch 21/200, Loss: 0.17468745376055056
0.6515929301719234
Epoch 31/200, Loss: 0.14720594711028612
0.6637166168272343
Epoch 41/200, Loss: 0.12505645792071635
0.6842675560382933
Epoch 51/200, Loss: 0.10879465249868539
0.6869159743631458
Epoch 61/200, Loss: 0.0934253461085833
0.7027368308347213
Epoch 71/200, Loss: 0.08299155963154939
0.7072396401231761
Epoch 81/200, Loss: 0.07533822122674722
0.714060005451026
Epoch 91/200, Loss: 0.06943681377630967
0.716716909543698
Epoch 101/200, Loss: 0.0653636368134847
0.7251898151440901
Epoch 111/200, Loss: 0.06226502516521858
0.7320371054160696
Epoch 121/200, Loss: 0.060215688668764554
0.7311983067781057
Epoch 131/200, Loss: 0.05870053759561135
0.7325712937806765
Epoch 141/200, Loss: 0.057034884937680684
0.73262407381962
Epoch 151/200, Loss: 0.05588428031366605
0.730226809215349
Epoch 161/200, Loss: 0.05434054981630582
0.73379257724754

[I 2024-01-21 07:56:01,749] Trial 2 finished with value: 0.7384353769575507 and parameters: {'hidden_dim_h': 12, 'dropout': 0.09103452059887784, 'batch_size': 783}. Best is trial 2 with value: 0.7384353769575507.


Epoch 1/200, Loss: 0.23237790167331696
0.563474503701154
Epoch 11/200, Loss: 0.168749682881214
0.650357209380276
Epoch 21/200, Loss: 0.1372361174888081
0.6603036559522317
Epoch 31/200, Loss: 0.1130937288204829
0.6723064326683263
Epoch 41/200, Loss: 0.09483210466526172
0.696467777416646
Epoch 51/200, Loss: 0.08062996715307236
0.7099259455981664
Epoch 61/200, Loss: 0.07150224499680378
0.7114975638594208
Epoch 71/200, Loss: 0.06225388193572009
0.7242300587409097
Epoch 81/200, Loss: 0.05715651106503275
0.726439835649284
Epoch 91/200, Loss: 0.050116744030404975
0.7364728737368917
Epoch 101/200, Loss: 0.04652337274617619
0.7371120121066408
Epoch 111/200, Loss: 0.04332536693524431
0.7377767288208951
Epoch 121/200, Loss: 0.04208471432880119
0.7293680904352375
Epoch 131/200, Loss: 0.03726117768221431
0.73824172471092
Epoch 141/200, Loss: 0.03610517381242028
0.7331501935226559
Epoch 151/200, Loss: 0.03316733530826039
0.7372994595772184
Epoch 161/200, Loss: 0.03176689251429505
0.7407054065243591


[I 2024-01-21 07:57:10,492] Trial 3 finished with value: 0.7410772353227911 and parameters: {'hidden_dim_h': 37, 'dropout': 0.07908280603213001, 'batch_size': 742}. Best is trial 3 with value: 0.7410772353227911.


Epoch 1/200, Loss: 0.2400756451216611
0.5621129854081837
Epoch 11/200, Loss: 0.19839864427393133
0.6149420971472142
Epoch 21/200, Loss: 0.1737301993099126
0.6415564387644569
Epoch 31/200, Loss: 0.15173348784446716
0.6500002752012121
Epoch 41/200, Loss: 0.1366283463483507
0.6570653284969443
Epoch 51/200, Loss: 0.11933204938064922
0.6700672554398666
Epoch 61/200, Loss: 0.10748260502110828
0.6779507875969536
Epoch 71/200, Loss: 0.09630948576060208
0.6889247736935226
Epoch 81/200, Loss: 0.08813878047195348
0.6990435286723173
Epoch 91/200, Loss: 0.08234277401458133
0.7033402865229977
Epoch 101/200, Loss: 0.07755001905289563
0.7094530908752563
Epoch 111/200, Loss: 0.07246750830249353
0.7145989622374453
Epoch 121/200, Loss: 0.06986486488445239
0.7182285045706845
Epoch 131/200, Loss: 0.06754429926249114
0.7260924205320249
Epoch 141/200, Loss: 0.06470574709502133
0.7241910280584022
Epoch 151/200, Loss: 0.06346729939634149
0.7318832481521298
Epoch 161/200, Loss: 0.062414235350760544
0.7304723486

[I 2024-01-21 07:58:06,808] Trial 4 finished with value: 0.7387994831024697 and parameters: {'hidden_dim_h': 17, 'dropout': 0.22219324499362597, 'batch_size': 948}. Best is trial 3 with value: 0.7410772353227911.


Epoch 1/200, Loss: 0.671419002793052
0.5557711374798505
Epoch 11/200, Loss: 0.29965555938807403
0.5961533608481069
Epoch 21/200, Loss: 0.1604174409400333
0.6391109357188405
Epoch 31/200, Loss: 0.11740462719039484
0.6538759280586192
Epoch 41/200, Loss: 0.10475496270439842
0.6735014034072807
Epoch 51/200, Loss: 0.10013283484361389
0.6783013366951975
Epoch 61/200, Loss: 0.09638392891396176
0.6886540300489605
Epoch 71/200, Loss: 0.0926846634935249
0.7008662117618701
Epoch 81/200, Loss: 0.08883136307651346
0.6999993292579056
Epoch 91/200, Loss: 0.08611157773570581
0.7122924514744443
Epoch 101/200, Loss: 0.08318410475145686
0.7117285164300522
Epoch 111/200, Loss: 0.07941076870669019
0.7177737193961249
Epoch 121/200, Loss: 0.07684768702496182
0.7229517286928743
Epoch 131/200, Loss: 0.07419703528285027
0.725935495846027
Epoch 141/200, Loss: 0.07202375070615248
0.7261510602445347
Epoch 151/200, Loss: 0.06983480365438895
0.7329261568745945
Epoch 161/200, Loss: 0.06762803887779062
0.7316068267123

[I 2024-01-21 07:58:59,950] Trial 5 finished with value: 0.7402138516935 and parameters: {'hidden_dim_h': 15, 'dropout': 0.31400531487540595, 'batch_size': 925}. Best is trial 3 with value: 0.7410772353227911.


Epoch 1/200, Loss: 1.9831012884775798
0.5661457068567883
Epoch 11/200, Loss: 1.290617755481175
0.5766742700850188
Epoch 21/200, Loss: 0.8501273620696295
0.6107696921670015
Epoch 31/200, Loss: 0.5842441859699431
0.6203612294222323
Epoch 41/200, Loss: 0.419183516786212
0.009676089089488657
Epoch 51/200, Loss: 0.3228562729699271
0.001521379883815768
Epoch 61/200, Loss: 0.28131240606307983
0.0025021354768540874
Epoch 71/200, Loss: 0.2667427864812669
0.0011511550406127123
Epoch 81/200, Loss: 0.26151630921023233
0.001481433288160976
Epoch 91/200, Loss: 0.2611117909351985
0.0007414421678186611
Epoch 101/200, Loss: 0.2606714892955053
0.003420970108981865
Epoch 111/200, Loss: 0.2604507505893707
0.006803390252323901
Epoch 121/200, Loss: 0.2604640090749377
0.007210209350659857
Epoch 131/200, Loss: 0.26013374754360746
0.007477555784029624
Epoch 141/200, Loss: 0.26001939958050135
0.00736699331487223
Epoch 151/200, Loss: 0.2602595346314566
0.017925842569416824
Epoch 161/200, Loss: 0.2592660578943434

[I 2024-01-21 08:00:09,904] Trial 6 finished with value: 0.6203612294222323 and parameters: {'hidden_dim_h': 40, 'dropout': 0.2798870799107676, 'batch_size': 966}. Best is trial 3 with value: 0.7410772353227911.


Epoch 1/200, Loss: 0.5124843083322048
0.5619006398163873
Epoch 11/200, Loss: 0.2961839747925599
0.6214026022229158
Epoch 21/200, Loss: 0.24672681031127772
0.634341955046343
Epoch 31/200, Loss: 0.22313145734369755
0.6508187221376491
Epoch 41/200, Loss: 0.20034954883158207
0.5902019200353774
Epoch 51/200, Loss: 0.1770040219028791
0.6753796190888716
Epoch 61/200, Loss: 0.15499980126818022
0.6717222722931692
Epoch 71/200, Loss: 0.13508528160552183
0.6738314196684211
Epoch 81/200, Loss: 0.11684361379593611
0.6861597285934605
Epoch 91/200, Loss: 0.10142739831159513
0.718123373626676
Epoch 101/200, Loss: 0.08834695847084124
0.6927141188715888
Epoch 111/200, Loss: 0.07805196413149436
0.7131418071244398
Epoch 121/200, Loss: 0.06930345265815656
0.7126250359052635
Epoch 131/200, Loss: 0.06264282825092475
0.7364795886758286
Epoch 141/200, Loss: 0.05766416278978189
0.7189275132747871
Epoch 151/200, Loss: 0.05320757472266754
0.7364325597510534
Epoch 161/200, Loss: 0.05089791320885221
0.7409782696325

[I 2024-01-21 08:01:05,512] Trial 7 finished with value: 0.7415451157653813 and parameters: {'hidden_dim_h': 16, 'dropout': 0.08903441392164732, 'batch_size': 838}. Best is trial 7 with value: 0.7415451157653813.


Epoch 1/200, Loss: 0.16055543379237255
0.5905786897664752
Epoch 11/200, Loss: 0.10732166732971866
0.6561527239667555
Epoch 21/200, Loss: 0.0904753531018893
0.6811798679968
Epoch 31/200, Loss: 0.08138729414592187
0.6892348327370702
Epoch 41/200, Loss: 0.07656641180316608
0.6990303731295985
Epoch 51/200, Loss: 0.07265646957481901
0.7111367806077706
Epoch 61/200, Loss: 0.06789438977527122
0.7209507955747512
Epoch 71/200, Loss: 0.06307310502355297
0.7262541592380518
Epoch 81/200, Loss: 0.06146806517305473
0.7271947947930109
Epoch 91/200, Loss: 0.057732421128700175
0.7298343432110828
Epoch 101/200, Loss: 0.05532078739876548
0.7322972824508206
Epoch 111/200, Loss: 0.05180304187039534
0.7326324814186943
Epoch 121/200, Loss: 0.05116363971804579
0.7344608294267141
Epoch 131/200, Loss: 0.0476096470374614
0.7341792233530186
Epoch 141/200, Loss: 0.04512215033173561
0.7379308326358672
Epoch 151/200, Loss: 0.04292187017078201
0.7393297563706723
Epoch 161/200, Loss: 0.04204052803106606
0.740884100250

[I 2024-01-21 08:02:14,993] Trial 8 finished with value: 0.7419001965183424 and parameters: {'hidden_dim_h': 32, 'dropout': 0.11630754067624618, 'batch_size': 423}. Best is trial 8 with value: 0.7419001965183424.


Epoch 1/200, Loss: 0.18514998789344514
0.58213201128964
Epoch 11/200, Loss: 0.14485238194465638
0.6334079581188962
Epoch 21/200, Loss: 0.12287783601454326
0.6604295694130392
Epoch 31/200, Loss: 0.1114830378975187
0.6642341878140767
Epoch 41/200, Loss: 0.09429427087306977
0.6743142460698405
Epoch 51/200, Loss: 0.08605881418500627
0.6828972554729952
Epoch 61/200, Loss: 0.09300471033368791
0.6814028330922334
Epoch 71/200, Loss: 0.08878785393067769
0.6858587027456486
Epoch 81/200, Loss: 0.07780546599200794
0.706370062549569
Epoch 91/200, Loss: 0.07424481276954924
0.7089988107255328
Epoch 101/200, Loss: 0.07625552713871002
0.7074050027467547
Epoch 111/200, Loss: 0.0721303973879133
0.7111930592658962
Epoch 121/200, Loss: 0.07595506267888205
0.7077886123214255
Epoch 131/200, Loss: 0.0658745097794703
0.7203233457468149
Epoch 141/200, Loss: 0.0805027846779142
0.7009412023606312
Epoch 151/200, Loss: 0.06788637712597848
0.7202387522152398
Epoch 161/200, Loss: 0.06544919801609857
0.717537914426276

[I 2024-01-21 08:03:20,107] Trial 9 finished with value: 0.7325754549594626 and parameters: {'hidden_dim_h': 32, 'dropout': 0.10063114077820262, 'batch_size': 588}. Best is trial 8 with value: 0.7419001965183424.


Epoch 1/200, Loss: 1.718220736226465
0.5359472010443116
Epoch 11/200, Loss: 0.2764068333766399
0.009785388709325188
Epoch 21/200, Loss: 0.24598766417584866
0.034758351973465454
Epoch 31/200, Loss: 0.2403490994221125
0.07294481452874119
Epoch 41/200, Loss: 0.2385797313390634
0.06369757199698348
Epoch 51/200, Loss: 0.23921759604898274
0.05732842631025185
Epoch 61/200, Loss: 0.2402225728982534
0.05324022762510527
Epoch 71/200, Loss: 0.2409645173794184
0.06903295810606205
Epoch 81/200, Loss: 0.23655057405559426
0.06448131131708662
Epoch 91/200, Loss: 0.23572933635650536
0.055256814970295436
Epoch 101/200, Loss: 0.23770785242573828
0.08406165631740985
Epoch 111/200, Loss: 0.2336508695386414
0.10513975640895067
Epoch 121/200, Loss: 0.23553174886948022
0.07780022714176633
Epoch 131/200, Loss: 0.23810338146156734
0.10624903199909216
Epoch 141/200, Loss: 0.23515232009255987
0.10225577676782045
Epoch 151/200, Loss: 0.2367712556042223
0.09486996125101485
Epoch 161/200, Loss: 0.23956523886603168
0

[I 2024-01-21 08:05:13,716] Trial 10 finished with value: 0.5359472010443116 and parameters: {'hidden_dim_h': 50, 'dropout': 0.16789704857462576, 'batch_size': 172}. Best is trial 8 with value: 0.7419001965183424.


Epoch 1/200, Loss: 3.2596952828493984
0.4638360769639689
Epoch 11/200, Loss: 1.282093713500283
0.5760286214202125
Epoch 21/200, Loss: 0.5219336401332508
0.6310869935959381
Epoch 31/200, Loss: 0.3136457565155896
0.6463232117667563
Epoch 41/200, Loss: 0.2666335636919195
0.6514351356877397
Epoch 51/200, Loss: 0.2401546380736611
0.653716062061867
Epoch 61/200, Loss: 0.21124744008887897
0.6705535695110892
Epoch 71/200, Loss: 0.1786173714832826
0.6827088280791819
Epoch 81/200, Loss: 0.1467928244308992
0.701888347028742
Epoch 91/200, Loss: 0.11804961291226473
0.7177081725093636
Epoch 101/200, Loss: 0.09383093592795459
0.7252560886697227
Epoch 111/200, Loss: 0.0753945074298165
0.7214784335139374
Epoch 121/200, Loss: 0.061552670394832434
0.7339035763895223
Epoch 131/200, Loss: 0.054150015115737915
0.7359576227662624
Epoch 141/200, Loss: 0.05016227384859866
0.7383178499847336
Epoch 151/200, Loss: 0.046305530586025934
0.7420316363602217
Epoch 161/200, Loss: 0.04461178556084633
0.737987444947576
E

[I 2024-01-21 08:06:22,048] Trial 11 finished with value: 0.7420316363602217 and parameters: {'hidden_dim_h': 24, 'dropout': 0.14960810032415595, 'batch_size': 369}. Best is trial 11 with value: 0.7420316363602217.


Epoch 1/200, Loss: 0.35175927031424736
0.5842061021182459
Epoch 11/200, Loss: 0.15414473823001307
0.6498629144153713
Epoch 21/200, Loss: 0.12502926744280324
0.6653225003770599
Epoch 31/200, Loss: 0.10176421846112897
0.6701520767567751
Epoch 41/200, Loss: 0.0866716859802123
0.6885874550015921
Epoch 51/200, Loss: 0.07860597018753329
0.7029500496113871
Epoch 61/200, Loss: 0.07276742869327145
0.7192199515156183
Epoch 71/200, Loss: 0.06881610358193997
0.7179928379227947
Epoch 81/200, Loss: 0.06622352583273765
0.7299577215718998
Epoch 91/200, Loss: 0.06307139013323092
0.7366559438679984
Epoch 101/200, Loss: 0.0622157231574097
0.7273899501481513
Epoch 111/200, Loss: 0.05803683075693346
0.742919609215753
Epoch 121/200, Loss: 0.05622551500076248
0.7443206468712248
Epoch 131/200, Loss: 0.05278481038347367
0.7418419714415044
Epoch 141/200, Loss: 0.05152450796336897
0.7473107361183652
Epoch 151/200, Loss: 0.04915272708862058
0.7422768230898988
Epoch 161/200, Loss: 0.048480381708472006
0.7434174480

[I 2024-01-21 08:07:36,478] Trial 12 finished with value: 0.7473107361183652 and parameters: {'hidden_dim_h': 26, 'dropout': 0.1678093997237562, 'batch_size': 327}. Best is trial 12 with value: 0.7473107361183652.


Epoch 1/200, Loss: 0.35246084423004825
0.5809034659850083
Epoch 11/200, Loss: 0.18071455951732926
0.6465669077924846
Epoch 21/200, Loss: 0.13262282274191892
0.6639053293798788
Epoch 31/200, Loss: 0.1014038033877747
0.6635455111765001
Epoch 41/200, Loss: 0.08517783484126948
0.6919856411062039
Epoch 51/200, Loss: 0.07846503921701939
0.6979807266025229
Epoch 61/200, Loss: 0.0744795058441313
0.703085579539641
Epoch 71/200, Loss: 0.06985597501072703
0.7130930445156363
Epoch 81/200, Loss: 0.06791246913467781
0.7181625222838145
Epoch 91/200, Loss: 0.06585751426748082
0.7268573029756392
Epoch 101/200, Loss: 0.06342895083789583
0.7261043768571478
Epoch 111/200, Loss: 0.06139718995818609
0.7284181701746891
Epoch 121/200, Loss: 0.0591205358505249
0.7318247502020234
Epoch 131/200, Loss: 0.05688437814765339
0.7358657811648784
Epoch 141/200, Loss: 0.05568049980115287
0.7273765519621774
Epoch 151/200, Loss: 0.053949009532792656
0.727010586463242
Epoch 161/200, Loss: 0.052454369496318355
0.74003746786

[I 2024-01-21 08:08:56,172] Trial 13 finished with value: 0.7400374678654627 and parameters: {'hidden_dim_h': 22, 'dropout': 0.1679958582398178, 'batch_size': 254}. Best is trial 12 with value: 0.7473107361183652.


Epoch 1/200, Loss: 0.21736054191222556
0.5860488696907503
Epoch 11/200, Loss: 0.14137320484106358
0.6422308855657278
Epoch 21/200, Loss: 0.10648490362442457
0.6687902976421191
Epoch 31/200, Loss: 0.08952256750601989
0.6804541169981413
Epoch 41/200, Loss: 0.08007294168839088
0.6968080011309911
Epoch 51/200, Loss: 0.07413650235304466
0.7085815296071959
Epoch 61/200, Loss: 0.06978958357985203
0.7052831108977548
Epoch 71/200, Loss: 0.0656268277993569
0.7167228089968838
Epoch 81/200, Loss: 0.06254499078943179
0.7219014936571755
Epoch 91/200, Loss: 0.058782616945413445
0.7231048080734047
Epoch 101/200, Loss: 0.0561888901086954
0.7280865457172315
Epoch 111/200, Loss: 0.05380736406032856
0.7282932139541026
Epoch 121/200, Loss: 0.05193044709471556
0.7378389410985845
Epoch 131/200, Loss: 0.05014440921636728
0.7334134954675463
Epoch 141/200, Loss: 0.048632834679805316
0.734868170748368
Epoch 151/200, Loss: 0.04715246254434952
0.7386422347721785
Epoch 161/200, Loss: 0.045944133744790006
0.74180761

[I 2024-01-21 08:10:09,698] Trial 14 finished with value: 0.7481291388823108 and parameters: {'hidden_dim_h': 24, 'dropout': 0.1644199994509371, 'batch_size': 308}. Best is trial 14 with value: 0.7481291388823108.


Epoch 1/200, Loss: 0.24803855438737105
0.5714147186746137
Epoch 11/200, Loss: 0.1273532452156944
0.6401543501951531
Epoch 21/200, Loss: 0.09389614172442987
0.6667343824371157
Epoch 31/200, Loss: 0.08636055427202344
0.6887544555027709
Epoch 41/200, Loss: 0.08282821448723765
0.6907628021659601
Epoch 51/200, Loss: 0.07887497000450636
0.6887627009430424
Epoch 61/200, Loss: 0.07552511383690973
0.7114561947572025
Epoch 71/200, Loss: 0.07213229294458445
0.7122308169171976
Epoch 81/200, Loss: 0.06929144056609077
0.7067400761954555
Epoch 91/200, Loss: 0.06653431996050542
0.7201920139540233
Epoch 101/200, Loss: 0.06346801195266473
0.7245191903349449
Epoch 111/200, Loss: 0.06177457693937051
0.7311104520353423
Epoch 121/200, Loss: 0.06059694600148793
0.7319734120926971
Epoch 131/200, Loss: 0.05903768449695441
0.7373668222784111
Epoch 141/200, Loss: 0.05646592174677083
0.734550315268019
Epoch 151/200, Loss: 0.05554588998321199
0.7313163589767214
Epoch 161/200, Loss: 0.053852618284469106
0.737823433

[I 2024-01-21 08:12:02,084] Trial 15 finished with value: 0.739922530021854 and parameters: {'hidden_dim_h': 25, 'dropout': 0.20476160625393378, 'batch_size': 146}. Best is trial 14 with value: 0.7481291388823108.


Epoch 1/200, Loss: 0.3467962789748396
0.5873168790326447
Epoch 11/200, Loss: 0.21342705376446247
0.6419852513496804
Epoch 21/200, Loss: 0.14957972376474313
0.6696658592782695
Epoch 31/200, Loss: 0.10998026414641313
0.6878365192046706
Epoch 41/200, Loss: 0.08892933665109533
0.7029749582735216
Epoch 51/200, Loss: 0.0772894407356424
0.7066421020849539
Epoch 61/200, Loss: 0.07134646456688643
0.7189988757484214
Epoch 71/200, Loss: 0.06715903584180134
0.7216125795846738
Epoch 81/200, Loss: 0.06472265500841397
0.7335367807858937
Epoch 91/200, Loss: 0.06179007788055709
0.7242236020468416
Epoch 101/200, Loss: 0.060071792852665694
0.7371081639710131
Epoch 111/200, Loss: 0.05833153945526907
0.7409248243212133
Epoch 121/200, Loss: 0.05537425387384636
0.7391212303477431
Epoch 131/200, Loss: 0.05431403306179813
0.7511851205611119
Epoch 141/200, Loss: 0.05401110489453588
0.7479814884117499
Epoch 151/200, Loss: 0.05032905803195068
0.7496524004430679
Epoch 161/200, Loss: 0.04945294598915747
0.748261280

[I 2024-01-21 08:13:14,605] Trial 16 finished with value: 0.756164132510553 and parameters: {'hidden_dim_h': 28, 'dropout': 0.1400993933263601, 'batch_size': 362}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.22744004496119238
0.5793314348799237
Epoch 11/200, Loss: 0.15067924389784987
0.6507595326503106
Epoch 21/200, Loss: 0.11355290358716791
0.6622670017716967
Epoch 31/200, Loss: 0.09371467476541345
0.6797744705115237
Epoch 41/200, Loss: 0.0816733662716367
0.6982010912554296
Epoch 51/200, Loss: 0.07424073378470811
0.7111154563017819
Epoch 61/200, Loss: 0.06896479614078999
0.7247338401768777
Epoch 71/200, Loss: 0.06492437092079358
0.726355889650256
Epoch 81/200, Loss: 0.06128431120040742
0.7350110505669472
Epoch 91/200, Loss: 0.05849444561383941
0.7368698659331147
Epoch 101/200, Loss: 0.05515865346586162
0.7445454690177961
Epoch 111/200, Loss: 0.054163316772742706
0.7412079377746075
Epoch 121/200, Loss: 0.051392013376409355
0.7415228775154571
Epoch 131/200, Loss: 0.05025917655703696
0.7461830924200858
Epoch 141/200, Loss: 0.048603427173061806
0.7442183449979016
Epoch 151/200, Loss: 0.047219117934053596
0.7466535553171689
Epoch 161/200, Loss: 0.04700925421308388
0.751314

[I 2024-01-21 08:14:18,677] Trial 17 finished with value: 0.7530257510189344 and parameters: {'hidden_dim_h': 20, 'dropout': 0.13440412193045204, 'batch_size': 462}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.41597603418325124
0.5474475772358164
Epoch 11/200, Loss: 0.20797875092217796
0.6095041112792824
Epoch 21/200, Loss: 0.1769865743423763
0.644653683189869
Epoch 31/200, Loss: 0.1489925792342738
0.6720045083987959
Epoch 41/200, Loss: 0.1236559652576321
0.6824189471220458
Epoch 51/200, Loss: 0.10471160141261
0.6992473654063852
Epoch 61/200, Loss: 0.08872913235896512
0.6956294306168818
Epoch 71/200, Loss: 0.07800200561943807
0.708093192265945
Epoch 81/200, Loss: 0.07129717657440587
0.7057102728486224
Epoch 91/200, Loss: 0.06603436162205119
0.7111111562760917
Epoch 101/200, Loss: 0.06311900511776146
0.7155834360343842
Epoch 111/200, Loss: 0.06062218448833415
0.7176193309527891
Epoch 121/200, Loss: 0.058652387539807116
0.7222300948818836
Epoch 131/200, Loss: 0.05737192938594442
0.7197138757343765
Epoch 141/200, Loss: 0.05621746231458689
0.7258562754688899
Epoch 151/200, Loss: 0.0556394568595447
0.7237620730682098
Epoch 161/200, Loss: 0.054573976483784224
0.726581890869233

[I 2024-01-21 08:15:15,342] Trial 18 finished with value: 0.7314679689210527 and parameters: {'hidden_dim_h': 10, 'dropout': 0.055830168752134104, 'batch_size': 536}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.3269305635582317
0.5457301651812861
Epoch 11/200, Loss: 0.20715263282710855
0.6314092408762368
Epoch 21/200, Loss: 0.1603857163678516
0.659066422486357
Epoch 31/200, Loss: 0.1258173334327611
0.6712408734145615
Epoch 41/200, Loss: 0.1023291229185733
0.6790575534538345
Epoch 51/200, Loss: 0.08632556586103006
0.6980967832893169
Epoch 61/200, Loss: 0.07784246483987028
0.7119282736431364
Epoch 71/200, Loss: 0.07076719530265439
0.7216794976970152
Epoch 81/200, Loss: 0.06713868440552191
0.7282780977792432
Epoch 91/200, Loss: 0.06355647209354422
0.7280017131550072
Epoch 101/200, Loss: 0.060884160582314835
0.7353031095482138
Epoch 111/200, Loss: 0.05737811860374429
0.7425030307005435
Epoch 121/200, Loss: 0.05616378953511065
0.7423672909017865
Epoch 131/200, Loss: 0.05374487277797677
0.7434081190621659
Epoch 141/200, Loss: 0.052061585540121254
0.750595098778585
Epoch 151/200, Loss: 0.05148741907694123
0.7435955489622105
Epoch 161/200, Loss: 0.049667065370489254
0.74613319924

[I 2024-01-21 08:16:19,444] Trial 19 finished with value: 0.750595098778585 and parameters: {'hidden_dim_h': 20, 'dropout': 0.13294929145676015, 'batch_size': 462}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.23609976662743476
0.5897773067099882
Epoch 11/200, Loss: 0.17194616169698776
0.6390206981429507
Epoch 21/200, Loss: 0.13579297642554006
0.6521470834059725
Epoch 31/200, Loss: 0.11312736691005769
0.6672667142378114
Epoch 41/200, Loss: 0.09638983900508573
0.6741309668791575
Epoch 51/200, Loss: 0.08574401923725682
0.7005532471385119
Epoch 61/200, Loss: 0.07731594601946493
0.7062810495106668
Epoch 71/200, Loss: 0.07188960188819517
0.7113678331325229
Epoch 81/200, Loss: 0.0675460634933364
0.7180372579651774
Epoch 91/200, Loss: 0.06348969667188582
0.727929897928836
Epoch 101/200, Loss: 0.06044639118256107
0.7309736754816698
Epoch 111/200, Loss: 0.05792486775786646
0.7314650786613719
Epoch 121/200, Loss: 0.055858828247554844
0.7355074383310477
Epoch 131/200, Loss: 0.05272815881236907
0.7360122856856917
Epoch 141/200, Loss: 0.05098724016739476
0.7419326425262688
Epoch 151/200, Loss: 0.049533627446620696
0.7360950301331779
Epoch 161/200, Loss: 0.04788035022154931
0.73968747

[I 2024-01-21 08:17:22,428] Trial 20 finished with value: 0.7467932070238312 and parameters: {'hidden_dim_h': 29, 'dropout': 0.20553915040461257, 'batch_size': 650}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.28003664977020687
0.5552219652248255
Epoch 11/200, Loss: 0.1855892731083764
0.6416127912281614
Epoch 21/200, Loss: 0.15213036603397792
0.6601479907443997
Epoch 31/200, Loss: 0.12287807199690078
0.6754550831315059
Epoch 41/200, Loss: 0.10085809462600284
0.6880314609356037
Epoch 51/200, Loss: 0.08498620142539343
0.7074758214843084
Epoch 61/200, Loss: 0.07458736971020699
0.7104078853379713
Epoch 71/200, Loss: 0.06695933764179547
0.7234920116951906
Epoch 81/200, Loss: 0.06217751411928071
0.7283328381113356
Epoch 91/200, Loss: 0.05867801300353474
0.73779287089705
Epoch 101/200, Loss: 0.05589523075355424
0.7423227462047743
Epoch 111/200, Loss: 0.05318925057848294
0.7402981404918755
Epoch 121/200, Loss: 0.05155434037248294
0.74102148746581
Epoch 131/200, Loss: 0.05006329243381818
0.7417065249945549
Epoch 141/200, Loss: 0.05120938445130984
0.7249508189132623
Epoch 151/200, Loss: 0.04741575734482871
0.7411999387598318
Epoch 161/200, Loss: 0.04622197813457913
0.7402046628386

[I 2024-01-21 08:18:25,239] Trial 21 finished with value: 0.7512027376190267 and parameters: {'hidden_dim_h': 21, 'dropout': 0.13123187633377686, 'batch_size': 450}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.6594691667705774
0.5647798381901916
Epoch 11/200, Loss: 0.2946661994792521
0.617132576598766
Epoch 21/200, Loss: 0.2262791944667697
0.6428084193342439
Epoch 31/200, Loss: 0.20543338730931282
0.6614046558370605
Epoch 41/200, Loss: 0.1835908107459545
0.66882847152861
Epoch 51/200, Loss: 0.1597145050764084
0.6850307612852052
Epoch 61/200, Loss: 0.13722584769129753
0.6839193655793296
Epoch 71/200, Loss: 0.11741970432922244
0.7143167273051957
Epoch 81/200, Loss: 0.10150943463668227
0.7150564821064143
Epoch 91/200, Loss: 0.08815594553016126
0.7241429327641552
Epoch 101/200, Loss: 0.07675136555917561
0.7293069061148258
Epoch 111/200, Loss: 0.0689933969406411
0.736145327387026
Epoch 121/200, Loss: 0.06176702806260437
0.7425983339890536
Epoch 131/200, Loss: 0.056846028892323375
0.7501224540620587
Epoch 141/200, Loss: 0.053546470939181745
0.7455038419762219
Epoch 151/200, Loss: 0.05114833568222821
0.7522230096280809
Epoch 161/200, Loss: 0.051013907068409026
0.749376874942867

[I 2024-01-21 08:19:24,165] Trial 22 finished with value: 0.7522230096280809 and parameters: {'hidden_dim_h': 19, 'dropout': 0.1368866336139898, 'batch_size': 643}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.8104717096974773
0.568862548221567
Epoch 11/200, Loss: 0.3098577876244822
0.6492163600041827
Epoch 21/200, Loss: 0.16245499637819105
0.6654075344564562
Epoch 31/200, Loss: 0.13021738851262676
0.6811560361765142
Epoch 41/200, Loss: 0.11938855508642812
0.6989821267131393
Epoch 51/200, Loss: 0.10939562681221193
0.7098431452509951
Epoch 61/200, Loss: 0.09870742838228902
0.7168052776068417
Epoch 71/200, Loss: 0.08881966361115055
0.7252052413011668
Epoch 81/200, Loss: 0.07875846590726607
0.7327273695007285
Epoch 91/200, Loss: 0.06924907767003582
0.7363880158761833
Epoch 101/200, Loss: 0.061254296331636364
0.7391755379103984
Epoch 111/200, Loss: 0.053913903572866996
0.7305838594241264
Epoch 121/200, Loss: 0.04721668819265981
0.7431122536959475
Epoch 131/200, Loss: 0.04146215307616418
0.741766354834839
Epoch 141/200, Loss: 0.03793461752995368
0.7495801969157192
Epoch 151/200, Loss: 0.034834291004846175
0.735811991889341
Epoch 161/200, Loss: 0.031575742448049206
0.739038450

[I 2024-01-21 08:20:27,238] Trial 23 finished with value: 0.7495801969157192 and parameters: {'hidden_dim_h': 29, 'dropout': 0.05390842597891558, 'batch_size': 652}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.20484124563443354
0.5784454467632744
Epoch 11/200, Loss: 0.12602418842606056
0.6463217915180498
Epoch 21/200, Loss: 0.09790070125689873
0.6596337796391867
Epoch 31/200, Loss: 0.08668824524069443
0.6833354559464913
Epoch 41/200, Loss: 0.08005925812400304
0.6947587370970282
Epoch 51/200, Loss: 0.07669713362478293
0.7055684714060384
Epoch 61/200, Loss: 0.07342334960897763
0.7124534289203994
Epoch 71/200, Loss: 0.06912754065333268
0.724943563671144
Epoch 81/200, Loss: 0.06604055960017902
0.7291097687909187
Epoch 91/200, Loss: 0.063381913332985
0.7241583246738491
Epoch 101/200, Loss: 0.060999423217697024
0.7315151515004711
Epoch 111/200, Loss: 0.058378612431578145
0.7331021321561024
Epoch 121/200, Loss: 0.05737282450382526
0.7336178920050512
Epoch 131/200, Loss: 0.05521860761711231
0.7372618369502185
Epoch 141/200, Loss: 0.053533987452586494
0.741650844022625
Epoch 151/200, Loss: 0.052913413502466984
0.7381134324668482
Epoch 161/200, Loss: 0.04993710958231718
0.74345634

[I 2024-01-21 08:21:45,898] Trial 24 finished with value: 0.7466009297561322 and parameters: {'hidden_dim_h': 18, 'dropout': 0.13184722814394612, 'batch_size': 259}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.0301512815058231
0.5263210470173747
Epoch 11/200, Loss: 0.450645606033504
0.5984479761748314
Epoch 21/200, Loss: 0.26911368500441313
0.6179109840366477
Epoch 31/200, Loss: 0.22439678898081183
0.6403987055803151
Epoch 41/200, Loss: 0.20623587630689144
0.6471715636987623
Epoch 51/200, Loss: 0.18930165516212583
0.6576239694721521
Epoch 61/200, Loss: 0.17111751856282353
0.6682648934596536
Epoch 71/200, Loss: 0.15343263326212764
0.6792246877503961
Epoch 81/200, Loss: 0.13586926367133856
0.6820234123961376
Epoch 91/200, Loss: 0.1200896070804447
0.6874796098812612
Epoch 101/200, Loss: 0.10535843204706907
0.7058586233215698
Epoch 111/200, Loss: 0.09425020543858409
0.7169289385531564
Epoch 121/200, Loss: 0.08389983791857958
0.7022597718810072
Epoch 131/200, Loss: 0.07637686701491475
0.7097398203277105
Epoch 141/200, Loss: 0.07081640756223351
0.7295854678324933
Epoch 151/200, Loss: 0.06644943309947848
0.7290697843346324
Epoch 161/200, Loss: 0.06277301488444209
0.733473719405

[I 2024-01-21 08:22:42,170] Trial 25 finished with value: 0.74049511650429 and parameters: {'hidden_dim_h': 14, 'dropout': 0.18939623176178055, 'batch_size': 626}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.470657748394999
0.5746298925068644
Epoch 11/200, Loss: 0.25102469736132127
0.6338929090259261
Epoch 21/200, Loss: 0.21328637260815192
0.653989359643362
Epoch 31/200, Loss: 0.18904758887044315
0.6642898130408319
Epoch 41/200, Loss: 0.16352269824208884
0.6722181875667345
Epoch 51/200, Loss: 0.14075826159838972
0.6890574608570963
Epoch 61/200, Loss: 0.118821883509899
0.7000541080949513
Epoch 71/200, Loss: 0.10089382066808898
0.7137210350186284
Epoch 81/200, Loss: 0.08472959388946665
0.7290430100120695
Epoch 91/200, Loss: 0.0724026627581695
0.7261032613197194
Epoch 101/200, Loss: 0.06252911776818078
0.7330285816563886
Epoch 111/200, Loss: 0.05570559100858096
0.7372169918886167
Epoch 121/200, Loss: 0.050324940732840835
0.7422680463037132
Epoch 131/200, Loss: 0.04733116950454383
0.7387598075997988
Epoch 141/200, Loss: 0.04278385459349073
0.7385272506433301
Epoch 151/200, Loss: 0.04096828786463573
0.7475098841460783
Epoch 161/200, Loss: 0.03946344284661885
0.7405271792871

[I 2024-01-21 08:23:44,778] Trial 26 finished with value: 0.7488943460956162 and parameters: {'hidden_dim_h': 27, 'dropout': 0.1113774793579, 'batch_size': 708}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.32508469621340436
0.5758258048842243
Epoch 11/200, Loss: 0.23462515821059546
0.6219239130926549
Epoch 21/200, Loss: 0.17880310490727425
0.6506588975496413
Epoch 31/200, Loss: 0.14135652325219578
0.6601307296891414
Epoch 41/200, Loss: 0.11373793540729417
0.6708058953689454
Epoch 51/200, Loss: 0.09731989146934615
0.6895871261292216
Epoch 61/200, Loss: 0.08530982294016415
0.6921762725103023
Epoch 71/200, Loss: 0.07894441154268053
0.7064427891419971
Epoch 81/200, Loss: 0.07295462903049257
0.7169752173370353
Epoch 91/200, Loss: 0.06823877721197075
0.7142045304795496
Epoch 101/200, Loss: 0.06600676539043586
0.7254120790494373
Epoch 111/200, Loss: 0.06426490201718277
0.7303318159194807
Epoch 121/200, Loss: 0.06151642308880886
0.7315681240486901
Epoch 131/200, Loss: 0.06095070909294817
0.7332330826954785
Epoch 141/200, Loss: 0.0580918797188335
0.7406640634147832
Epoch 151/200, Loss: 0.05692303874012497
0.741429850181149
Epoch 161/200, Loss: 0.0553117481370767
0.73842501222

[I 2024-01-21 08:24:45,093] Trial 27 finished with value: 0.741429850181149 and parameters: {'hidden_dim_h': 20, 'dropout': 0.2288315746595384, 'batch_size': 559}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 2.448484507890848
0.47179563953193404
Epoch 11/200, Loss: 0.8795662304529777
0.02888469782886647
Epoch 21/200, Loss: 0.36815803154156757
0.03687837395023739
Epoch 31/200, Loss: 0.2641741768098794
0.03793371340246447
Epoch 41/200, Loss: 0.25278559527718103
0.054333968483877455
Epoch 51/200, Loss: 0.25195103453902096
0.05833756837981589
Epoch 61/200, Loss: 0.2527320215908381
0.04259616729625677
Epoch 71/200, Loss: 0.25355382091723955
0.03281086049157052
Epoch 81/200, Loss: 0.25556387351109433
0.05228983833428806
Epoch 91/200, Loss: 0.2544342651963234
0.038716868811673376
Epoch 101/200, Loss: 0.2551279285779366
0.03428511529253354
Epoch 111/200, Loss: 0.2530952012882783
0.03526557679549429
Epoch 121/200, Loss: 0.252727585629775
0.05119867534764913
Epoch 131/200, Loss: 0.25388834081017053
0.019449741316877548
Epoch 141/200, Loss: 0.2586804198531004
0.015591800906560694
Epoch 151/200, Loss: 0.2560312914160582
0.019165221475411977
Epoch 161/200, Loss: 0.2506282077385829
0.

[I 2024-01-21 08:26:01,346] Trial 28 finished with value: 0.47179563953193404 and parameters: {'hidden_dim_h': 35, 'dropout': 0.14715707696223257, 'batch_size': 389}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.5346471087800132
0.5347371600828116
Epoch 11/200, Loss: 0.26417171789540184
0.602332323740094
Epoch 21/200, Loss: 0.1573326140642166
0.6453041401156433
Epoch 31/200, Loss: 0.12170739885833529
0.6641152647899968
Epoch 41/200, Loss: 0.11023107378019227
0.6718594139545431
Epoch 51/200, Loss: 0.1035782326426771
0.6838657722915088
Epoch 61/200, Loss: 0.09956039860844612
0.6940513133962383
Epoch 71/200, Loss: 0.09472860644261043
0.7057382582743029
Epoch 81/200, Loss: 0.09085455785195033
0.7158624939987601
Epoch 91/200, Loss: 0.0864673981236087
0.7168198097447299
Epoch 101/200, Loss: 0.08255328527755207
0.7206271285754361
Epoch 111/200, Loss: 0.07768744230270386
0.7232344968215326
Epoch 121/200, Loss: 0.07444287464022636
0.7256963614789569
Epoch 131/200, Loss: 0.07136910325951046
0.7312995058613017
Epoch 141/200, Loss: 0.06774706641832988
0.735962375656762
Epoch 151/200, Loss: 0.06595452626546223
0.7390377218742529
Epoch 161/200, Loss: 0.06259490984181564
0.73718471684960

[I 2024-01-21 08:26:56,463] Trial 29 finished with value: 0.7416850611015668 and parameters: {'hidden_dim_h': 18, 'dropout': 0.1890318601583572, 'batch_size': 1130}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.33410378563694837
0.5687359777839827
Epoch 11/200, Loss: 0.19628981191937517
0.6388595632300436
Epoch 21/200, Loss: 0.16846826999652675
0.6584280600615725
Epoch 31/200, Loss: 0.14131218776470278
0.6675987414159744
Epoch 41/200, Loss: 0.11646668685645592
0.6874896889149961
Epoch 51/200, Loss: 0.09581519099997311
0.6991241687639393
Epoch 61/200, Loss: 0.07980243861675262
0.7145224394268581
Epoch 71/200, Loss: 0.06961191282039736
0.7218174211772695
Epoch 81/200, Loss: 0.06374851786872236
0.7288628330766634
Epoch 91/200, Loss: 0.056242737373927744
0.7410144054636179
Epoch 101/200, Loss: 0.05113702839831027
0.7443994005039652
Epoch 111/200, Loss: 0.052049669641547086
0.7354795120037967
Epoch 121/200, Loss: 0.045666614683662975
0.7456175711711359
Epoch 131/200, Loss: 0.041928252704986714
0.7486848440276281
Epoch 141/200, Loss: 0.04079660109993888
0.7470461558439262
Epoch 151/200, Loss: 0.03865089939861763
0.7416186377381975
Epoch 161/200, Loss: 0.037365620910394484
0.750

[I 2024-01-21 08:28:04,451] Trial 30 finished with value: 0.7544272720341877 and parameters: {'hidden_dim_h': 32, 'dropout': 0.07633750945244452, 'batch_size': 490}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.3444235244902169
0.5779814732148917
Epoch 11/200, Loss: 0.23071740713061356
0.6420340233025007
Epoch 21/200, Loss: 0.17561532702387833
0.6583025539785784
Epoch 31/200, Loss: 0.13495305471303987
0.6738693496920117
Epoch 41/200, Loss: 0.10544344219492703
0.6976215784781594
Epoch 51/200, Loss: 0.08586916054894285
0.7076484622077349
Epoch 61/200, Loss: 0.07130582467084978
0.7144970818590957
Epoch 71/200, Loss: 0.06290763062311382
0.7284638970623797
Epoch 81/200, Loss: 0.055724081015441476
0.7219295325089398
Epoch 91/200, Loss: 0.05149697730454003
0.728107240796818
Epoch 101/200, Loss: 0.047147466006075466
0.7373035279674108
Epoch 111/200, Loss: 0.04441307121660651
0.7326896986200718
Epoch 121/200, Loss: 0.041330815270179656
0.7333433906682609
Epoch 131/200, Loss: 0.03981628514281133
0.7374726028385402
Epoch 141/200, Loss: 0.03788348014761762
0.7288730145428771
Epoch 151/200, Loss: 0.036406765623790464
0.7343427860878197
Epoch 161/200, Loss: 0.03435177714904634
0.735684

[I 2024-01-21 08:29:16,239] Trial 31 finished with value: 0.7374726028385402 and parameters: {'hidden_dim_h': 33, 'dropout': 0.07064269110527037, 'batch_size': 495}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.7199532389640808
0.575732412841672
Epoch 11/200, Loss: 0.20000117673323706
0.6341914204584351
Epoch 21/200, Loss: 0.11041766748978542
0.6765255872654891
Epoch 31/200, Loss: 0.09842694340608059
0.6926460750074516
Epoch 41/200, Loss: 0.09348587214182584
0.6959381339947163
Epoch 51/200, Loss: 0.08428247425800715
0.7124032932199768
Epoch 61/200, Loss: 0.07751060143495217
0.7202121197097201
Epoch 71/200, Loss: 0.07180468718975018
0.7186932264109379
Epoch 81/200, Loss: 0.06464641054089253
0.714556234745349
Epoch 91/200, Loss: 0.05939134372732578
0.7343697900658029
Epoch 101/200, Loss: 0.0546884111677989
0.7363142239696694
Epoch 111/200, Loss: 0.04977203189180447
0.7427909679151405
Epoch 121/200, Loss: 0.046847316794670545
0.7381100343667639
Epoch 131/200, Loss: 0.04366351625858209
0.7372868584385188
Epoch 141/200, Loss: 0.040845335580599614
0.7383162461613345
Epoch 151/200, Loss: 0.039527020584314294
0.7372138098422925
Epoch 161/200, Loss: 0.03740698920610624
0.743594711

[I 2024-01-21 08:30:29,985] Trial 32 finished with value: 0.7456794824036879 and parameters: {'hidden_dim_h': 40, 'dropout': 0.11473925915853198, 'batch_size': 514}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.246525337850606
0.5829133165586243
Epoch 11/200, Loss: 0.12421676921255795
0.6573791095332997
Epoch 21/200, Loss: 0.09926988000487104
0.6791250042761945
Epoch 31/200, Loss: 0.08266467978189021
0.695477873488585
Epoch 41/200, Loss: 0.07359223375901763
0.7036934110404259
Epoch 51/200, Loss: 0.06745898397064504
0.7150601501175563
Epoch 61/200, Loss: 0.06246112802146393
0.7188013942782058
Epoch 71/200, Loss: 0.057834231191211276
0.7267332479898487
Epoch 81/200, Loss: 0.05469945068528623
0.7280184892070297
Epoch 91/200, Loss: 0.051150846766468916
0.7331381811788024
Epoch 101/200, Loss: 0.04835073576297289
0.7318859177249364
Epoch 111/200, Loss: 0.046650313346842186
0.7311616103206485
Epoch 121/200, Loss: 0.04382203077828443
0.7340381715889954
Epoch 131/200, Loss: 0.04119054011908578
0.730716948365562
Epoch 141/200, Loss: 0.0397336861739556
0.7275275472159672
Epoch 151/200, Loss: 0.03771741706647991
0.7297674939102103
Epoch 161/200, Loss: 0.03679194487631321
0.7357472704

[I 2024-01-21 08:31:54,461] Trial 33 finished with value: 0.737678485191724 and parameters: {'hidden_dim_h': 29, 'dropout': 0.07359845607334421, 'batch_size': 247}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.7265869264419262
0.5514734683640807
Epoch 11/200, Loss: 0.4893422768666194
0.6188706632245078
Epoch 21/200, Loss: 0.1647673101665882
0.6512793215840316
Epoch 31/200, Loss: 0.114055724384693
0.6845216492464602
Epoch 41/200, Loss: 0.1031785889600332
0.70316040242147
Epoch 51/200, Loss: 0.09389832415259801
0.7171968349567887
Epoch 61/200, Loss: 0.08642408208778271
0.7167382576388504
Epoch 71/200, Loss: 0.07583237983859502
0.720331047497238
Epoch 81/200, Loss: 0.06700579750423248
0.7304139716373824
Epoch 91/200, Loss: 0.0599073595725573
0.740416213947644
Epoch 101/200, Loss: 0.054026149141673856
0.7403419607282953
Epoch 111/200, Loss: 0.04899625272418444
0.7443429014522286
Epoch 121/200, Loss: 0.04580301812921579
0.7448243019270112
Epoch 131/200, Loss: 0.043812661861570984
0.7471577667142585
Epoch 141/200, Loss: 0.0419716051278206
0.7426766449670581
Epoch 151/200, Loss: 0.0402299900037738
0.7524321004360961
Epoch 161/200, Loss: 0.039134753903803915
0.7469760766862035
E

[I 2024-01-21 08:33:01,365] Trial 34 finished with value: 0.7524654283343939 and parameters: {'hidden_dim_h': 23, 'dropout': 0.09561378153779969, 'batch_size': 386}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.22917804840419972
0.5819084935454549
Epoch 11/200, Loss: 0.13212520735604422
0.647883186766124
Epoch 21/200, Loss: 0.10671138617077044
0.6549679064384103
Epoch 31/200, Loss: 0.08847679277615887
0.6858013120032211
Epoch 41/200, Loss: 0.07884910476527043
0.7009003530611189
Epoch 51/200, Loss: 0.07149616708712918
0.715595640834154
Epoch 61/200, Loss: 0.06466402718797326
0.7260570923697445
Epoch 71/200, Loss: 0.06042594914989812
0.7390418020445852
Epoch 81/200, Loss: 0.057225659023970366
0.7326844637807159
Epoch 91/200, Loss: 0.05318738826151405
0.7410101303027176
Epoch 101/200, Loss: 0.050279481269951375
0.7439429978908625
Epoch 111/200, Loss: 0.048738905627812655
0.7410480338132123
Epoch 121/200, Loss: 0.04729517549276352
0.7410015197165726
Epoch 131/200, Loss: 0.044583962099360566
0.7422268355322176
Epoch 141/200, Loss: 0.04271214575107608
0.7403645850953455
Epoch 151/200, Loss: 0.04202780253919108
0.7377313594214226
Epoch 161/200, Loss: 0.04090164388929095
0.742624

[I 2024-01-21 08:34:10,194] Trial 35 finished with value: 0.747543768341806 and parameters: {'hidden_dim_h': 23, 'dropout': 0.09762977320462689, 'batch_size': 361}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.2239660984621598
0.5912771456052894
Epoch 11/200, Loss: 0.12061280828828995
0.6532453868916768
Epoch 21/200, Loss: 0.09347241887679467
0.6690202687467309
Epoch 31/200, Loss: 0.08053586352616549
0.6850163938919924
Epoch 41/200, Loss: 0.07374011091171549
0.7139919147622648
Epoch 51/200, Loss: 0.07193201723007056
0.7054673659407755
Epoch 61/200, Loss: 0.06682872224169281
0.7160278884968418
Epoch 71/200, Loss: 0.06513141898008493
0.725848732503565
Epoch 81/200, Loss: 0.06058665522589134
0.731797017037816
Epoch 91/200, Loss: 0.05867506370234948
0.7351255585914817
Epoch 101/200, Loss: 0.05695663815220961
0.7270621774452171
Epoch 111/200, Loss: 0.053964135523598925
0.7229346695258183
Epoch 121/200, Loss: 0.053710969344068035
0.73187881048904
Epoch 131/200, Loss: 0.05291017392077125
0.7374263045779258
Epoch 141/200, Loss: 0.04899556479918269
0.7357721385884177
Epoch 151/200, Loss: 0.05366837990900072
0.7411385244629095
Epoch 161/200, Loss: 0.04772626209216049
0.72873346887

[I 2024-01-21 08:35:47,575] Trial 36 finished with value: 0.7411385244629095 and parameters: {'hidden_dim_h': 37, 'dropout': 0.0720083222030652, 'batch_size': 194}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.48041922297883544
0.5874446956993774
Epoch 11/200, Loss: 0.2285745920653039
0.6229547292635716
Epoch 21/200, Loss: 0.19063277669409487
0.6471476884130996
Epoch 31/200, Loss: 0.15731886948676818
0.6507955313267205
Epoch 41/200, Loss: 0.12882678115621526
0.6671403497008054
Epoch 51/200, Loss: 0.11060062795877457
0.6754476050720836
Epoch 61/200, Loss: 0.09332468107025674
0.6850030329902598
Epoch 71/200, Loss: 0.08377318971968711
0.7005754255107776
Epoch 81/200, Loss: 0.07646016031503677
0.7083319769256566
Epoch 91/200, Loss: 0.07217947274763534
0.7116257489992265
Epoch 101/200, Loss: 0.06975656676482647
0.7107331675437842
Epoch 111/200, Loss: 0.0671015018002784
0.7218724156185671
Epoch 121/200, Loss: 0.06502799285536116
0.7248720070986894
Epoch 131/200, Loss: 0.06246432669936342
0.7347475737925515
Epoch 141/200, Loss: 0.061065910106643716
0.7238698985123388
Epoch 151/200, Loss: 0.059479007774845084
0.7275054890589796
Epoch 161/200, Loss: 0.05778535756659001
0.73269410

[I 2024-01-21 08:36:55,122] Trial 37 finished with value: 0.7352462485357811 and parameters: {'hidden_dim_h': 27, 'dropout': 0.3369908175918661, 'batch_size': 426}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.42397493669684505
0.5859876466175865
Epoch 11/200, Loss: 0.25801118473771595
0.001473579458720898
Epoch 21/200, Loss: 0.2574917493571698
0.03238501597161026
Epoch 31/200, Loss: 0.2549295983683895
0.01666133685579605
Epoch 41/200, Loss: 0.2540896329241739
0.027072868164097316
Epoch 51/200, Loss: 0.25337091298170494
0.02711206743075113
Epoch 61/200, Loss: 0.2505675035883004
0.027749196933532397
Epoch 71/200, Loss: 0.24811180922347056
0.03821013017737177
Epoch 81/200, Loss: 0.24793282277147535
0.047111704736867745
Epoch 91/200, Loss: 0.25046946758955296
0.042497708915033794
Epoch 101/200, Loss: 0.2515114556315919
0.03196960393907236
Epoch 111/200, Loss: 0.24871137486377232
0.043952796161625875
Epoch 121/200, Loss: 0.24771828046986755
0.06572475024844261
Epoch 131/200, Loss: 0.24426486332651595
0.07088949251628233
Epoch 141/200, Loss: 0.25319437955466795
0.03810169199659927
Epoch 151/200, Loss: 0.25130000668512265
0.014243181329068533
Epoch 161/200, Loss: 0.25128733838

[I 2024-01-21 08:38:18,537] Trial 38 finished with value: 0.5859876466175865 and parameters: {'hidden_dim_h': 34, 'dropout': 0.0888572041857, 'batch_size': 285}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.1875980365567091
0.5494586456494768
Epoch 11/200, Loss: 0.4525992470543559
0.6330477812813099
Epoch 21/200, Loss: 0.2711927898046447
0.6568817516558673
Epoch 31/200, Loss: 0.23158445409158382
0.6586998197977806
Epoch 41/200, Loss: 0.20836878004597453
0.6718939730128861
Epoch 51/200, Loss: 0.18376364213664356
0.6762711179545157
Epoch 61/200, Loss: 0.15768509630749866
0.6917654195003088
Epoch 71/200, Loss: 0.13296342423049415
0.6985057241485788
Epoch 81/200, Loss: 0.1098864907171668
0.7166006433339587
Epoch 91/200, Loss: 0.09066212468030976
0.7255967710453815
Epoch 101/200, Loss: 0.07477371649044316
0.7334745829706121
Epoch 111/200, Loss: 0.06365379109615232
0.7345237371413391
Epoch 121/200, Loss: 0.05437419000195294
0.7443459707026141
Epoch 131/200, Loss: 0.048007862960420006
0.7387745024962304
Epoch 141/200, Loss: 0.04326750229044658
0.7489249602619362
Epoch 151/200, Loss: 0.040924373105531785
0.7469873409109943
Epoch 161/200, Loss: 0.038797407978918494
0.750044600

[I 2024-01-21 08:39:26,076] Trial 39 finished with value: 0.7548695181129738 and parameters: {'hidden_dim_h': 31, 'dropout': 0.10675710357313072, 'batch_size': 498}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.42638593673706054
0.5702407124372
Epoch 11/200, Loss: 0.2320810651779175
0.6401385913744247
Epoch 21/200, Loss: 0.19643722236156463
0.649512017154132
Epoch 31/200, Loss: 0.18223159909248351
0.655362485579545
Epoch 41/200, Loss: 0.16760989725589753
0.6630375393603283
Epoch 51/200, Loss: 0.15254664421081543
0.6716722907823115
Epoch 61/200, Loss: 0.1376742935180664
0.6835223918635304
Epoch 71/200, Loss: 0.12337966561317444
0.6918602467228196
Epoch 81/200, Loss: 0.10978035360574723
0.6952633216434745
Epoch 91/200, Loss: 0.09738602072000503
0.7075843564943834
Epoch 101/200, Loss: 0.08774363577365875
0.7073416137615901
Epoch 111/200, Loss: 0.0787650254368782
0.7221760393725487
Epoch 121/200, Loss: 0.07090308487415314
0.7197931061294317
Epoch 131/200, Loss: 0.06567492380738259
0.7305944687884736
Epoch 141/200, Loss: 0.06141968160867691
0.7356430602365583
Epoch 151/200, Loss: 0.05744821190834046
0.7390406259160499
Epoch 161/200, Loss: 0.05425860941410065
0.7348150717018422

[I 2024-01-21 08:40:35,972] Trial 40 finished with value: 0.7448196862149702 and parameters: {'hidden_dim_h': 40, 'dropout': 0.26169178592892184, 'batch_size': 819}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.4346859482201664
0.553663061729754
Epoch 11/200, Loss: 0.4526671746915037
0.6152741015805154
Epoch 21/200, Loss: 0.17101258784532547
0.6631691561893747
Epoch 31/200, Loss: 0.11788321303373034
0.687313351424679
Epoch 41/200, Loss: 0.10570342296903784
0.7040539417975448
Epoch 51/200, Loss: 0.09743128242817792
0.7134446423926512
Epoch 61/200, Loss: 0.08904775062745268
0.7260154019039913
Epoch 71/200, Loss: 0.08080582371489568
0.7335090576990273
Epoch 81/200, Loss: 0.0711265979334712
0.7444592807963138
Epoch 91/200, Loss: 0.064329852942716
0.7389494841584743
Epoch 101/200, Loss: 0.05722735966132446
0.7460628571023662
Epoch 111/200, Loss: 0.051140051927756176
0.7498563429089231
Epoch 121/200, Loss: 0.04763972369784659
0.7447859948896347
Epoch 131/200, Loss: 0.042972627519206566
0.7410847899423266
Epoch 141/200, Loss: 0.040976595556871456
0.7420047010828159
Epoch 151/200, Loss: 0.038796748711981556
0.7473914462935761
Epoch 161/200, Loss: 0.037654104981232776
0.7511658773

[I 2024-01-21 08:41:45,425] Trial 41 finished with value: 0.7511658773099594 and parameters: {'hidden_dim_h': 31, 'dropout': 0.11007720129385917, 'batch_size': 462}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.19425356914015376
0.5837356755528182
Epoch 11/200, Loss: 0.1331429044697799
0.6496146880825278
Epoch 21/200, Loss: 0.10474826760736167
0.6638178647853364
Epoch 31/200, Loss: 0.09025163656356287
0.6839096656054852
Epoch 41/200, Loss: 0.08027518986194741
0.6852727369499328
Epoch 51/200, Loss: 0.07632334150520026
0.7044935053928046
Epoch 61/200, Loss: 0.06946808720628421
0.7256985948760121
Epoch 71/200, Loss: 0.06562770757020689
0.7210196820191167
Epoch 81/200, Loss: 0.0605866529193579
0.7296673392389943
Epoch 91/200, Loss: 0.058818917283240485
0.7283920749147708
Epoch 101/200, Loss: 0.05431377646677634
0.73488870628278
Epoch 111/200, Loss: 0.05128413862457462
0.7438209515562152
Epoch 121/200, Loss: 0.04970803352839807
0.7445254644409636
Epoch 131/200, Loss: 0.04784276803918913
0.7438851047517192
Epoch 141/200, Loss: 0.045514025816730426
0.7388536670360094
Epoch 151/200, Loss: 0.0430332383177444
0.7454197169195317
Epoch 161/200, Loss: 0.04238582256377912
0.74710299415

[I 2024-01-21 08:42:54,223] Trial 42 finished with value: 0.7508412973143755 and parameters: {'hidden_dim_h': 27, 'dropout': 0.09362026844161114, 'batch_size': 399}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.3525909814569685
0.5628398619638998
Epoch 11/200, Loss: 0.5729281389051013
0.6196920556746915
Epoch 21/200, Loss: 0.3055856318937408
0.6523740660217752
Epoch 31/200, Loss: 0.23681960213515493
0.6720987847102516
Epoch 41/200, Loss: 0.2137405164539814
0.6740632337297067
Epoch 51/200, Loss: 0.19426235556602478
0.6887785796830006
Epoch 61/200, Loss: 0.1729783643451002
0.690210891617855
Epoch 71/200, Loss: 0.1517352635661761
0.7163265018170281
Epoch 81/200, Loss: 0.1309070825162861
0.7193044897756617
Epoch 91/200, Loss: 0.11072947250472175
0.7264457793666848
Epoch 101/200, Loss: 0.0931613768140475
0.7307590429860205
Epoch 111/200, Loss: 0.0775429250465499
0.7374395561206076
Epoch 121/200, Loss: 0.06472491886880663
0.7379427727732042
Epoch 131/200, Loss: 0.05381516615549723
0.7410075241134056
Epoch 141/200, Loss: 0.04726399067375395
0.7460381403991965
Epoch 151/200, Loss: 0.04238399501062102
0.7459674774293478
Epoch 161/200, Loss: 0.038087960332632065
0.7396509608592791


[I 2024-01-21 08:44:04,280] Trial 43 finished with value: 0.748258573055922 and parameters: {'hidden_dim_h': 35, 'dropout': 0.12381093581865966, 'batch_size': 564}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.0509419901329173
0.5503294270151826
Epoch 11/200, Loss: 0.24327109440376884
0.639281413032985
Epoch 21/200, Loss: 0.1501910456439905
0.6525005174061688
Epoch 31/200, Loss: 0.13398322763673046
0.6772663520677865
Epoch 41/200, Loss: 0.1189920729712436
0.6944818021994077
Epoch 51/200, Loss: 0.10371402441932444
0.7021270160094312
Epoch 61/200, Loss: 0.08851028103054616
0.7213604587682798
Epoch 71/200, Loss: 0.07686281138867662
0.718575316735715
Epoch 81/200, Loss: 0.06723143696262125
0.7264112978363482
Epoch 91/200, Loss: 0.05957353958173802
0.7378996165648694
Epoch 101/200, Loss: 0.05397467485122513
0.7342242613215314
Epoch 111/200, Loss: 0.052069859154391704
0.7426158288554244
Epoch 121/200, Loss: 0.04869423963521656
0.7410323704817159
Epoch 131/200, Loss: 0.047040294202273354
0.743738305778501
Epoch 141/200, Loss: 0.045796309189315425
0.7437339093981773
Epoch 151/200, Loss: 0.04262568684000718
0.7475084798287986
Epoch 161/200, Loss: 0.04189944777049517
0.74708283387

[I 2024-01-21 08:45:17,601] Trial 44 finished with value: 0.7499035404776955 and parameters: {'hidden_dim_h': 30, 'dropout': 0.15079317643206822, 'batch_size': 352}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 2.795580886659168
0.44570899812574166
Epoch 11/200, Loss: 1.3022043108940125
0.23104979569659742
Epoch 21/200, Loss: 0.5193850497404734
0.603776970380797
Epoch 31/200, Loss: 0.22802807355210894
0.6558043732157578
Epoch 41/200, Loss: 0.14476251282862254
0.6684732964771989
Epoch 51/200, Loss: 0.12495154195598193
0.6861740461109864
Epoch 61/200, Loss: 0.11708715043607212
0.6953964645562201
Epoch 71/200, Loss: 0.10803262073369253
0.7059035814976625
Epoch 81/200, Loss: 0.10036482484567733
0.7092100605983305
Epoch 91/200, Loss: 0.09267845732115564
0.7149559683194732
Epoch 101/200, Loss: 0.08330842675197692
0.716139802841654
Epoch 111/200, Loss: 0.07498326525092125
0.7323132812462325
Epoch 121/200, Loss: 0.06703359190197218
0.7321384452442885
Epoch 131/200, Loss: 0.06034224365083944
0.7333693193043935
Epoch 141/200, Loss: 0.054119538161016646
0.734818186347911
Epoch 151/200, Loss: 0.049819051509811765
0.7364083497203613
Epoch 161/200, Loss: 0.04676432499573344
0.74796624634

[I 2024-01-21 08:46:21,430] Trial 45 finished with value: 0.7503113820209246 and parameters: {'hidden_dim_h': 23, 'dropout': 0.06494840257482251, 'batch_size': 485}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.4803169635789735
0.5521029704964756
Epoch 11/200, Loss: 0.23677224878753936
0.6309633225889922
Epoch 21/200, Loss: 0.19776910224131175
0.6488425310347684
Epoch 31/200, Loss: 0.17733169187392508
0.6520297797910648
Epoch 41/200, Loss: 0.1573666754577841
0.6702618506651604
Epoch 51/200, Loss: 0.1371661810470479
0.6851310263910209
Epoch 61/200, Loss: 0.11866634977715355
0.6843455253950499
Epoch 71/200, Loss: 0.10261694554771696
0.6993359567926771
Epoch 81/200, Loss: 0.08983057072120053
0.7095166949322582
Epoch 91/200, Loss: 0.08030296808906964
0.6507528514293568
Epoch 101/200, Loss: 0.07127829960414342
0.7196468990507677
Epoch 111/200, Loss: 0.06486282830259629
0.6812364391595681
Epoch 121/200, Loss: 0.06054495035537651
0.6644336334756823
Epoch 131/200, Loss: 0.05669660520340715
0.7321592251001916
Epoch 141/200, Loss: 0.053662686475685666
0.726137072443225
Epoch 151/200, Loss: 0.05227827467024326
0.7405481655451097
Epoch 161/200, Loss: 0.05034650569515569
0.71985123319

[I 2024-01-21 08:47:16,570] Trial 46 finished with value: 0.7440889407834749 and parameters: {'hidden_dim_h': 14, 'dropout': 0.08267054455186268, 'batch_size': 726}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 2.0387294584391067
0.5247428208559799
Epoch 11/200, Loss: 0.7554689511960867
0.003027399730619249
Epoch 21/200, Loss: 0.3372143221144773
0.0020444027379596954
Epoch 31/200, Loss: 0.26568950986375617
0.004108234933265394
Epoch 41/200, Loss: 0.25658735024685764
0.006290098512701474
Epoch 51/200, Loss: 0.24533204308577947
0.07519451601189972
Epoch 61/200, Loss: 0.2395539907168369
0.11889029304611544
Epoch 71/200, Loss: 0.23845062024739325
0.15456418601005054
Epoch 81/200, Loss: 0.24947993974296415
0.03641503118875607
Epoch 91/200, Loss: 0.24047364872329088
0.13368146699387437
Epoch 101/200, Loss: 0.24331724765349408
0.09110814250784861
Epoch 111/200, Loss: 0.2423257547981885
0.08931136077943894
Epoch 121/200, Loss: 0.2442085128657672
0.0883881434176028
Epoch 131/200, Loss: 0.24214348379446535
0.07930820786787736
Epoch 141/200, Loss: 0.24106364682012674
0.08840789566921725
Epoch 151/200, Loss: 0.24855887524935663
0.05252576369216388
Epoch 161/200, Loss: 0.253351094771404

[I 2024-01-21 08:48:36,479] Trial 47 finished with value: 0.5247428208559799 and parameters: {'hidden_dim_h': 42, 'dropout': 0.1036088280857688, 'batch_size': 415}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.17682994157075882
0.5774967904031639
Epoch 11/200, Loss: 0.12637574751587474
0.6451549605412904
Epoch 21/200, Loss: 0.10582613682045657
0.6686172286318895
Epoch 31/200, Loss: 0.09239464012138984
0.6812560745770233
Epoch 41/200, Loss: 0.08234025012044345
0.6950489041243615
Epoch 51/200, Loss: 0.07480398017693968
0.7028289882200948
Epoch 61/200, Loss: 0.06924620007767397
0.7236874558569414
Epoch 71/200, Loss: 0.06360661808182211
0.7313350386388955
Epoch 81/200, Loss: 0.06008615399546483
0.7360556409245519
Epoch 91/200, Loss: 0.05691153238363126
0.7415576954089048
Epoch 101/200, Loss: 0.053839338943362236
0.7423329910934757
Epoch 111/200, Loss: 0.051188377663493156
0.7440559834785115
Epoch 121/200, Loss: 0.04943102324271903
0.7474002219991235
Epoch 131/200, Loss: 0.04707165084340993
0.7515509751680765
Epoch 141/200, Loss: 0.04563825873329359
0.747805910855212
Epoch 151/200, Loss: 0.04528870608876733
0.7446940787095032
Epoch 161/200, Loss: 0.04309437423944473
0.7486106

[I 2024-01-21 08:49:39,688] Trial 48 finished with value: 0.7515509751680765 and parameters: {'hidden_dim_h': 25, 'dropout': 0.1218327579233456, 'batch_size': 599}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.868794141356478
0.5444834852676438
Epoch 11/200, Loss: 0.10545549249833393
0.6569985096752322
Epoch 21/200, Loss: 0.09349536311995123
0.6742873919208048
Epoch 31/200, Loss: 0.08618042479778074
0.6836582367504405
Epoch 41/200, Loss: 0.08197021357638319
0.7059626870127748
Epoch 51/200, Loss: 0.07570130339602835
0.7087863052795305
Epoch 61/200, Loss: 0.07350871358642873
0.7047909776873232
Epoch 71/200, Loss: 0.06933046693039924
0.7036796352893946
Epoch 81/200, Loss: 0.07032884868610766
0.7166047718778402
Epoch 91/200, Loss: 0.06534320811174579
0.7188822180156892
Epoch 101/200, Loss: 0.07843684028718889
0.7003944743874757
Epoch 111/200, Loss: 0.07567151378571373
0.6941046515224016
Epoch 121/200, Loss: 0.06482390229849472
0.7235624049205435
Epoch 131/200, Loss: 0.0738801782585911
0.7017605607283584
Epoch 141/200, Loss: 0.07923751485716436
0.6763261691710286
Epoch 151/200, Loss: 0.07072509590958811
0.720263873947038
Epoch 161/200, Loss: 0.06958879399852655
0.706833945303

[I 2024-01-21 08:51:12,926] Trial 49 finished with value: 0.7264183776828177 and parameters: {'hidden_dim_h': 38, 'dropout': 0.1522504359665706, 'batch_size': 207}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.1097925528883934
0.5435650981966714
Epoch 11/200, Loss: 0.31057355273514986
0.005961301548273769
Epoch 21/200, Loss: 0.2596840593032539
0.002307002901019116
Epoch 31/200, Loss: 0.2579207965172827
0.0054120168182642085
Epoch 41/200, Loss: 0.2560072364285588
0.010081534914611667
Epoch 51/200, Loss: 0.2555537293665111
0.013636518526523726
Epoch 61/200, Loss: 0.2564631968270987
0.018868900619759252
Epoch 71/200, Loss: 0.25372795830480754
0.025540699255331274
Epoch 81/200, Loss: 0.25329081784002483
0.007243671684569493
Epoch 91/200, Loss: 0.25305810919962823
0.015879261050324167
Epoch 101/200, Loss: 0.254225536249578
0.024053934927224876
Epoch 111/200, Loss: 0.2542034527286887
0.021787721822776863
Epoch 121/200, Loss: 0.25157871400006115
0.023279357958901202
Epoch 131/200, Loss: 0.24898414872586727
0.032991518405041595
Epoch 141/200, Loss: 0.2488037806469947
0.026462283940856174
Epoch 151/200, Loss: 0.24435869324952364
0.04627735560060607
Epoch 161/200, Loss: 0.24383726

[I 2024-01-21 08:52:30,057] Trial 50 finished with value: 0.5435650981966714 and parameters: {'hidden_dim_h': 32, 'dropout': 0.08015473109446722, 'batch_size': 317}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.4111203710238139
0.5495368286907
Epoch 11/200, Loss: 0.24906414945920308
0.6147662947545144
Epoch 21/200, Loss: 0.2157313644886017
0.6236522738576312
Epoch 31/200, Loss: 0.18710061609745027
0.6379082370374566
Epoch 41/200, Loss: 0.15781444509824116
0.6387686677641006
Epoch 51/200, Loss: 0.1380137321849664
0.655608882659831
Epoch 61/200, Loss: 0.1195935145020485
0.664762315706718
Epoch 71/200, Loss: 0.11238887632886568
0.6541573950708229
Epoch 81/200, Loss: 0.09677248497804006
0.678883235042981
Epoch 91/200, Loss: 0.08802517876029015
0.6912457178656718
Epoch 101/200, Loss: 0.08243273670474688
0.6985187199206058
Epoch 111/200, Loss: 0.07647152518232664
0.7034580608608997
Epoch 121/200, Loss: 0.07529785335063935
0.7063770315403176
Epoch 131/200, Loss: 0.07415451978643735
0.7035950399243444
Epoch 141/200, Loss: 0.07070255229870478
0.7210259543635547
Epoch 151/200, Loss: 0.06645892014106115
0.7172020252112845
Epoch 161/200, Loss: 0.06989835699399312
0.7241209698555989
E

[I 2024-01-21 08:53:27,630] Trial 51 finished with value: 0.7293500987767146 and parameters: {'hidden_dim_h': 19, 'dropout': 0.14214919523675984, 'batch_size': 689}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.4083841290022876
0.5671533913009005
Epoch 11/200, Loss: 0.15144969482679624
0.6379424131912261
Epoch 21/200, Loss: 0.13033923748377207
0.6493664865656291
Epoch 31/200, Loss: 0.12035278593366211
0.661743950802075
Epoch 41/200, Loss: 0.10955171045419332
0.671201788730723
Epoch 51/200, Loss: 0.09953343989075841
0.680929835949896
Epoch 61/200, Loss: 0.08984133077634347
0.6900169695421627
Epoch 71/200, Loss: 0.08135292538114496
0.7048444238727966
Epoch 81/200, Loss: 0.07559417470081432
0.7147450735873303
Epoch 91/200, Loss: 0.07033586079204404
0.7202439912637569
Epoch 101/200, Loss: 0.06569826643209199
0.718664249681777
Epoch 111/200, Loss: 0.06306432852068462
0.7254339812227176
Epoch 121/200, Loss: 0.061191425432224535
0.7326227993300832
Epoch 131/200, Loss: 0.05854265653603786
0.7298471552753781
Epoch 141/200, Loss: 0.05764973969072909
0.7360917707394128
Epoch 151/200, Loss: 0.05669789710963095
0.7383612075560961
Epoch 161/200, Loss: 0.05521954132898434
0.737980856627

[I 2024-01-21 08:54:26,390] Trial 52 finished with value: 0.742547235851096 and parameters: {'hidden_dim_h': 16, 'dropout': 0.18348412902166078, 'batch_size': 543}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.7954132944177099
0.5671028778515139
Epoch 11/200, Loss: 0.1850154879739729
0.6124950100430177
Epoch 21/200, Loss: 0.10751509540161844
0.6738484256077918
Epoch 31/200, Loss: 0.08276226548320156
0.6910006974981253
Epoch 41/200, Loss: 0.07546268826571562
0.7156421871742461
Epoch 51/200, Loss: 0.07020276608103412
0.7220361416015517
Epoch 61/200, Loss: 0.0662463436818729
0.733197065023712
Epoch 71/200, Loss: 0.06287180287184688
0.730695718613525
Epoch 81/200, Loss: 0.06021260045005777
0.7348679591375257
Epoch 91/200, Loss: 0.05685741243894491
0.7421266428940797
Epoch 101/200, Loss: 0.05507480262615586
0.7361060686426188
Epoch 111/200, Loss: 0.05229691281325399
0.741619833061005
Epoch 121/200, Loss: 0.0495470008355076
0.7400329509082462
Epoch 131/200, Loss: 0.04878720848447522
0.7453752421329118
Epoch 141/200, Loss: 0.0467059109570448
0.7359470028262489
Epoch 151/200, Loss: 0.04575180171825791
0.7347726647694419
Epoch 161/200, Loss: 0.044000192150726154
0.743257771204113

[I 2024-01-21 08:56:44,798] Trial 53 finished with value: 0.7466385611561601 and parameters: {'hidden_dim_h': 21, 'dropout': 0.0971606392555254, 'batch_size': 113}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.2666992426795118
0.5827395596648642
Epoch 11/200, Loss: 0.19900150903884103
0.6291404794144951
Epoch 21/200, Loss: 0.15497169424505794
0.6513294916231211
Epoch 31/200, Loss: 0.12539593897321644
0.6699102670407064
Epoch 41/200, Loss: 0.10327029863701147
0.683431036482834
Epoch 51/200, Loss: 0.09022890031337738
0.70158336858044
Epoch 61/200, Loss: 0.07687961836071576
0.7077886335234156
Epoch 71/200, Loss: 0.06955041670623947
0.7168926261205614
Epoch 81/200, Loss: 0.06337034450296093
0.7203587080850989
Epoch 91/200, Loss: 0.05850108822478967
0.7229322222241165
Epoch 101/200, Loss: 0.05431977593723465
0.724354829517846
Epoch 111/200, Loss: 0.056896247298401946
0.7183864219814913
Epoch 121/200, Loss: 0.05062277100103743
0.7302356562279566
Epoch 131/200, Loss: 0.04835587980992654
0.7330817503205228
Epoch 141/200, Loss: 0.047129645505372214
0.7315676329863348
Epoch 151/200, Loss: 0.04397833895157365
0.7307189250579335
Epoch 161/200, Loss: 0.04150192165637717
0.73461312115

[I 2024-01-21 08:58:06,170] Trial 54 finished with value: 0.7351712840265059 and parameters: {'hidden_dim_h': 49, 'dropout': 0.12348405930401386, 'batch_size': 594}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.232787148692669
0.5706065205193925
Epoch 11/200, Loss: 0.12722711780896553
0.6327044742095127
Epoch 21/200, Loss: 0.11356697021386562
0.6595819160476787
Epoch 31/200, Loss: 0.10142735430063346
0.6680385192048912
Epoch 41/200, Loss: 0.09052459131448697
0.6884547686786575
Epoch 51/200, Loss: 0.08310672850945057
0.6895452972186125
Epoch 61/200, Loss: 0.07764611689326091
0.7013260190644103
Epoch 71/200, Loss: 0.07526152409040011
0.7070213718480838
Epoch 81/200, Loss: 0.07249642411867778
0.716165734794993
Epoch 91/200, Loss: 0.0702266866962115
0.7194323656524353
Epoch 101/200, Loss: 0.06883401586077152
0.7189046157581372
Epoch 111/200, Loss: 0.06702880675976093
0.7243781874430457
Epoch 121/200, Loss: 0.0657864466118507
0.7297637991032276
Epoch 131/200, Loss: 0.06461742262427624
0.7296835198697503
Epoch 141/200, Loss: 0.06416802117839837
0.7350214856441117
Epoch 151/200, Loss: 0.06269486124316852
0.7306273065025436
Epoch 161/200, Loss: 0.061121758264608875
0.735948364206

[I 2024-01-21 08:59:04,808] Trial 55 finished with value: 0.7388406701804062 and parameters: {'hidden_dim_h': 12, 'dropout': 0.1592377634408174, 'batch_size': 515}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.5290573666925016
0.5791031102015924
Epoch 11/200, Loss: 0.2455870509147644
0.6344252586032474
Epoch 21/200, Loss: 0.20421215535505957
0.6533211104717372
Epoch 31/200, Loss: 0.1678832199262536
0.6619033984247039
Epoch 41/200, Loss: 0.13531676631258882
0.6778630518921188
Epoch 51/200, Loss: 0.10864357180569482
0.6951154055224923
Epoch 61/200, Loss: 0.08940470736959706
0.7056155222301926
Epoch 71/200, Loss: 0.0754917845453905
0.7173778098364734
Epoch 81/200, Loss: 0.0672223217299451
0.7213821967878445
Epoch 91/200, Loss: 0.06039025245801262
0.7265157278456291
Epoch 101/200, Loss: 0.056043150956216065
0.7294983018697052
Epoch 111/200, Loss: 0.053427348723230156
0.7353604206328838
Epoch 121/200, Loss: 0.050013704711328384
0.7350004962570643
Epoch 131/200, Loss: 0.04860827650712884
0.739783569167653
Epoch 141/200, Loss: 0.04559622729278129
0.7350501349658197
Epoch 151/200, Loss: 0.04419053151555683
0.7401515356965774
Epoch 161/200, Loss: 0.04185022575699765
0.73627098394

[I 2024-01-21 09:00:12,389] Trial 56 finished with value: 0.7401515356965774 and parameters: {'hidden_dim_h': 28, 'dropout': 0.13396602543855166, 'batch_size': 440}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 2.3385639098974376
0.5418272467381804
Epoch 11/200, Loss: 1.3951481672433705
0.5463967929523859
Epoch 21/200, Loss: 0.8320095905890832
0.6068329933473626
Epoch 31/200, Loss: 0.5144895131771381
0.6398446416389824
Epoch 41/200, Loss: 0.355352527820147
0.667756932846147
Epoch 51/200, Loss: 0.28401511907577515
0.6811594067407782
Epoch 61/200, Loss: 0.25276639197881406
0.6904205362325585
Epoch 71/200, Loss: 0.23544101531688982
0.6962725682673756
Epoch 81/200, Loss: 0.22169108173021904
0.701744908416645
Epoch 91/200, Loss: 0.20757408554737383
0.7053403168136558
Epoch 101/200, Loss: 0.19307250816088456
0.7153978949320594
Epoch 111/200, Loss: 0.17759563372685358
0.7182598028878457
Epoch 121/200, Loss: 0.16171660790076622
0.728548733087051
Epoch 131/200, Loss: 0.1463749076311405
0.720903171769701
Epoch 141/200, Loss: 0.13012666255235672
0.7337844330413821
Epoch 151/200, Loss: 0.11502038429562862
0.7376709470648912
Epoch 161/200, Loss: 0.10078410059213638
0.7371804517504044
Ep

[I 2024-01-21 09:01:13,314] Trial 57 finished with value: 0.7429930662749203 and parameters: {'hidden_dim_h': 25, 'dropout': 0.059298949828034284, 'batch_size': 773}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 2.4328992263130518
0.5350266525053862
Epoch 11/200, Loss: 1.5747289864913276
0.5574781709990151
Epoch 21/200, Loss: 1.015638688336248
0.5984419470998866
Epoch 31/200, Loss: 0.6756754776705867
0.619307149394469
Epoch 41/200, Loss: 0.46283147775608563
0.6313927870459146
Epoch 51/200, Loss: 0.29934145056683087
0.6408433828100002
Epoch 61/200, Loss: 0.22640983954719876
0.6388679112130506
Epoch 71/200, Loss: 0.19364553625169006
0.6505070890262745
Epoch 81/200, Loss: 0.1793300677900729
0.6555445455860361
Epoch 91/200, Loss: 0.17174944799879324
0.6752842530512294
Epoch 101/200, Loss: 0.16492801515952402
0.6688176431380902
Epoch 111/200, Loss: 0.1579902787571368
0.6876533901382813
Epoch 121/200, Loss: 0.14954695947792218
0.6949160416076161
Epoch 131/200, Loss: 0.14116703297780908
0.7054982059764295
Epoch 141/200, Loss: 0.13368830538314322
0.7037146832139727
Epoch 151/200, Loss: 0.12353589061809622
0.7087892658896568
Epoch 161/200, Loss: 0.11611161219037097
0.7185299280577688

[I 2024-01-21 09:02:10,911] Trial 58 finished with value: 0.7271500594641749 and parameters: {'hidden_dim_h': 22, 'dropout': 0.17546986005466814, 'batch_size': 904}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 2.757239011296055
0.5218506552440743
Epoch 11/200, Loss: 0.9902729663932532
0.5914959921949289
Epoch 21/200, Loss: 0.4247062195811355
0.02326219410163603
Epoch 31/200, Loss: 0.21722474537397685
0.6387683748346497
Epoch 41/200, Loss: 0.1845720154151582
0.6481734612776987
Epoch 51/200, Loss: 0.16624947676533147
0.6680498603293803
Epoch 61/200, Loss: 0.14709856792500145
0.6754900116393906
Epoch 71/200, Loss: 0.12725267872998589
0.6855575755710052
Epoch 81/200, Loss: 0.1071373707892602
0.6996105827949122
Epoch 91/200, Loss: 0.08987747002066228
0.7118441409932467
Epoch 101/200, Loss: 0.07709609599489915
0.7115728794159303
Epoch 111/200, Loss: 0.06766521198707715
0.7286555799677914
Epoch 121/200, Loss: 0.06258428122913628
0.7321935914258847
Epoch 131/200, Loss: 0.05780224404052684
0.7288712178777402
Epoch 141/200, Loss: 0.05469406167404693
0.7342661785744703
Epoch 151/200, Loss: 0.05256480690941476
0.7416990034940929
Epoch 161/200, Loss: 0.05161922496923229
0.7416660227936

[I 2024-01-21 09:03:19,017] Trial 59 finished with value: 0.7475474023139135 and parameters: {'hidden_dim_h': 17, 'dropout': 0.10475881963364661, 'batch_size': 356}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.4480141093333562
0.5838005072805973
Epoch 11/200, Loss: 0.284565377732118
0.6278796060192284
Epoch 21/200, Loss: 0.2443135902285576
0.6404337528358746
Epoch 31/200, Loss: 0.20717861553033193
0.6516739804486844
Epoch 41/200, Loss: 0.172786250213782
0.6624513753378988
Epoch 51/200, Loss: 0.1419094870487849
0.682659335831683
Epoch 61/200, Loss: 0.1158998005092144
0.707735232270471
Epoch 71/200, Loss: 0.09453050047159195
0.7077692718664002
Epoch 81/200, Loss: 0.07805545305212339
0.7236024322853736
Epoch 91/200, Loss: 0.06562245587507884
0.7280051972375398
Epoch 101/200, Loss: 0.05610633293787638
0.7252674839359293
Epoch 111/200, Loss: 0.05042018803457419
0.7404540027289958
Epoch 121/200, Loss: 0.04634214689334234
0.732011059789259
Epoch 131/200, Loss: 0.04243612053493659
0.7375921295156763
Epoch 141/200, Loss: 0.04015593466659387
0.7376384826492421
Epoch 151/200, Loss: 0.039166669671734176
0.7390856472861131
Epoch 161/200, Loss: 0.03726898009578387
0.7330621853923214
E

[I 2024-01-21 09:04:22,109] Trial 60 finished with value: 0.7404540027289958 and parameters: {'hidden_dim_h': 31, 'dropout': 0.13699732442469295, 'batch_size': 672}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.207429578810027
0.533472233926426
Epoch 11/200, Loss: 0.5370409886042277
0.04695549040783539
Epoch 21/200, Loss: 0.2435736326557217
0.619338171500419
Epoch 31/200, Loss: 0.17023995518684387
0.646873774684905
Epoch 41/200, Loss: 0.15340669814384345
0.6583606367913505
Epoch 51/200, Loss: 0.1439826605897961
0.6691829134955422
Epoch 61/200, Loss: 0.1337448236617175
0.6790457541786494
Epoch 71/200, Loss: 0.12378982973821236
0.6878733344082576
Epoch 81/200, Loss: 0.11287471200480606
0.6941429788103194
Epoch 91/200, Loss: 0.10232448487570792
0.702233222762922
Epoch 101/200, Loss: 0.09312236692869302
0.7134069627831292
Epoch 111/200, Loss: 0.08431565242283272
0.7192198215671647
Epoch 121/200, Loss: 0.07756010081731912
0.7224765145022563
Epoch 131/200, Loss: 0.07045995861743436
0.7346495624251178
Epoch 141/200, Loss: 0.06436644968661395
0.7332701584059146
Epoch 151/200, Loss: 0.05990060836528287
0.7361032024233294
Epoch 161/200, Loss: 0.05622153819510431
0.7436794179253609


[I 2024-01-21 09:05:24,489] Trial 61 finished with value: 0.7458421566541931 and parameters: {'hidden_dim_h': 25, 'dropout': 0.12288365971437523, 'batch_size': 612}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.7935866253716606
0.5655540619105359
Epoch 11/200, Loss: 0.8199676990509033
0.6056727203751543
Epoch 21/200, Loss: 0.35374484402792794
0.6392390851673528
Epoch 31/200, Loss: 0.1942056042807443
0.6646754729990338
Epoch 41/200, Loss: 0.1522077488047736
0.6641370631089721
Epoch 51/200, Loss: 0.13997095482689995
0.6811387136228257
Epoch 61/200, Loss: 0.1337190100124904
0.6803447411780835
Epoch 71/200, Loss: 0.12430008862699782
0.6821798170384722
Epoch 81/200, Loss: 0.11614596715995244
0.6966846344579567
Epoch 91/200, Loss: 0.10786769155945097
0.693242911503682
Epoch 101/200, Loss: 0.09781557470560073
0.7017580628557113
Epoch 111/200, Loss: 0.08984416787113463
0.7137876231862644
Epoch 121/200, Loss: 0.08176868238619396
0.7252101420894574
Epoch 131/200, Loss: 0.07510836720466614
0.7086830697167639
Epoch 141/200, Loss: 0.06935207173228264
0.726708383067135
Epoch 151/200, Loss: 0.06386645734310151
0.7291860891596941
Epoch 161/200, Loss: 0.05932625596012388
0.731561129841718

[I 2024-01-21 09:06:25,248] Trial 62 finished with value: 0.7437890653294521 and parameters: {'hidden_dim_h': 24, 'dropout': 0.12245617383409342, 'batch_size': 582}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.20793893075350559
0.5771919218705265
Epoch 11/200, Loss: 0.15933527774883038
0.6389244422272272
Epoch 21/200, Loss: 0.12994036010720514
0.6682365457412646
Epoch 31/200, Loss: 0.10934901824503233
0.6761679802950255
Epoch 41/200, Loss: 0.09266295532385509
0.6925324926945793
Epoch 51/200, Loss: 0.0820231069669579
0.704743083875917
Epoch 61/200, Loss: 0.07289174086216724
0.721925646398332
Epoch 71/200, Loss: 0.06721052346807538
0.7206095806059978
Epoch 81/200, Loss: 0.05993168078588717
0.7344714142503435
Epoch 91/200, Loss: 0.05600921572609381
0.7322548674505799
Epoch 101/200, Loss: 0.053223458429177604
0.729767008646121
Epoch 111/200, Loss: 0.04894825759710687
0.7371942535447257
Epoch 121/200, Loss: 0.046833648374586395
0.7405028554040861
Epoch 131/200, Loss: 0.044525712728500366
0.7386693249744217
Epoch 141/200, Loss: 0.0420419622325536
0.7403443307919673
Epoch 151/200, Loss: 0.041980946831630936
0.7358980384283114
Epoch 161/200, Loss: 0.039690362458879296
0.74461599

[I 2024-01-21 09:07:28,351] Trial 63 finished with value: 0.744615993600436 and parameters: {'hidden_dim_h': 26, 'dropout': 0.08523091502182926, 'batch_size': 621}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.34643701357500895
0.5733143187639029
Epoch 11/200, Loss: 0.20284967621167502
0.6411247196611787
Epoch 21/200, Loss: 0.16315597686029615
0.6507587528623399
Epoch 31/200, Loss: 0.12967201162661826
0.6675342778407442
Epoch 41/200, Loss: 0.10472035762809571
0.699897282504365
Epoch 51/200, Loss: 0.08502680045508203
0.7026129073231966
Epoch 61/200, Loss: 0.07230346490229879
0.7147924969913267
Epoch 71/200, Loss: 0.06396182803880601
0.7163133979938856
Epoch 81/200, Loss: 0.058825235813856125
0.7314539475092451
Epoch 91/200, Loss: 0.05512392166114989
0.7372118097576423
Epoch 101/200, Loss: 0.051894490917523704
0.742960289303992
Epoch 111/200, Loss: 0.0491601884187687
0.7375388807296566
Epoch 121/200, Loss: 0.04747758504180681
0.746975796129928
Epoch 131/200, Loss: 0.04610510161590008
0.7465746241107334
Epoch 141/200, Loss: 0.0447130153576533
0.7496637527963882
Epoch 151/200, Loss: 0.043676799695406644
0.751276436759605
Epoch 161/200, Loss: 0.04281243451294445
0.74872682921

[I 2024-01-21 09:08:31,227] Trial 64 finished with value: 0.7516042997881057 and parameters: {'hidden_dim_h': 20, 'dropout': 0.11124131623908794, 'batch_size': 481}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 2.8722074883324757
0.5385483707009967
Epoch 11/200, Loss: 1.393543249084836
0.5730856125304955
Epoch 21/200, Loss: 0.6092331381071181
0.5656892023287532
Epoch 31/200, Loss: 0.2643865637836002
0.6351767431729413
Epoch 41/200, Loss: 0.16993191838264465
0.6471646221011983
Epoch 51/200, Loss: 0.14598881879023143
0.6634318149356723
Epoch 61/200, Loss: 0.1363045796751976
0.6768266203204584
Epoch 71/200, Loss: 0.12770258120837666
0.684236737001824
Epoch 81/200, Loss: 0.11792192572639101
0.6915162477253838
Epoch 91/200, Loss: 0.10787544044710341
0.7012509072605047
Epoch 101/200, Loss: 0.0968884788453579
0.7003587296242039
Epoch 111/200, Loss: 0.08793459939105171
0.7122063200698017
Epoch 121/200, Loss: 0.07794455492070743
0.724170531770169
Epoch 131/200, Loss: 0.07140759556066423
0.7218099802776069
Epoch 141/200, Loss: 0.06454988338408016
0.7307038174481115
Epoch 151/200, Loss: 0.05876258893736771
0.7322704428168755
Epoch 161/200, Loss: 0.05626486632085982
0.7346475573119511


[I 2024-01-21 09:09:33,970] Trial 65 finished with value: 0.7408556974119128 and parameters: {'hidden_dim_h': 19, 'dropout': 0.11208605363890774, 'batch_size': 477}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.23047806233167648
0.5907209193224312
Epoch 11/200, Loss: 0.1448391333222389
0.6483276563184646
Epoch 21/200, Loss: 0.11193219915032387
0.6691025210450209
Epoch 31/200, Loss: 0.09291839212179184
0.6870366927252097
Epoch 41/200, Loss: 0.07927883580327034
0.708746459840086
Epoch 51/200, Loss: 0.07148542180657387
0.7170917319250077
Epoch 61/200, Loss: 0.0661454214900732
0.7196698736291665
Epoch 71/200, Loss: 0.062089290991425516
0.727856212907947
Epoch 81/200, Loss: 0.0589850989729166
0.7419377797918776
Epoch 91/200, Loss: 0.05611758381128311
0.7401476585382581
Epoch 101/200, Loss: 0.053883477300405505
0.7392467125719818
Epoch 111/200, Loss: 0.05217712625861168
0.745640970347063
Epoch 121/200, Loss: 0.04983002446591854
0.7460482939632875
Epoch 131/200, Loss: 0.04846056222915649
0.7423019839318955
Epoch 141/200, Loss: 0.04737362042069435
0.7463694952273545
Epoch 151/200, Loss: 0.04610753014683724
0.7472781298364926
Epoch 161/200, Loss: 0.04473530039191246
0.743423790120

[I 2024-01-21 09:10:38,708] Trial 66 finished with value: 0.7507982332147913 and parameters: {'hidden_dim_h': 21, 'dropout': 0.1585807029951673, 'batch_size': 401}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 2.562801277637482
0.5561929331795206
Epoch 11/200, Loss: 1.1952077329158783
0.606768107126008
Epoch 21/200, Loss: 0.5729623734951019
0.6353437643822705
Epoch 31/200, Loss: 0.3403178259730339
0.6642546622000919
Epoch 41/200, Loss: 0.26996030621230604
0.6512092290792285
Epoch 51/200, Loss: 0.24422837160527705
0.6713621975269326
Epoch 61/200, Loss: 0.22363654114305972
0.6409100948947907
Epoch 71/200, Loss: 0.20235826596617698
0.6703099831465155
Epoch 81/200, Loss: 0.17960216104984283
0.6128596333960518
Epoch 91/200, Loss: 0.15651042610406876
0.6984905047442075
Epoch 101/200, Loss: 0.13392139058560132
0.663537145033314
Epoch 111/200, Loss: 0.11386788617819547
0.7083279790007452
Epoch 121/200, Loss: 0.09612916447222233
0.6659343203040841
Epoch 131/200, Loss: 0.08115646298974752
0.73192094023354
Epoch 141/200, Loss: 0.06909289564937353
0.6710559589105941
Epoch 151/200, Loss: 0.06072609936818481
0.7310812436873626
Epoch 161/200, Loss: 0.055016540084034206
0.7412654133920937

[I 2024-01-21 09:11:38,599] Trial 67 finished with value: 0.7473628897129445 and parameters: {'hidden_dim_h': 16, 'dropout': 0.08983745227121512, 'batch_size': 505}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.5787165732019477
0.5604055691157064
Epoch 11/200, Loss: 0.139726421278384
0.6525771337727035
Epoch 21/200, Loss: 0.12097414914104673
0.6653774098428936
Epoch 31/200, Loss: 0.10171850377486812
0.6940527923571415
Epoch 41/200, Loss: 0.08400385578473409
0.7069017594063839
Epoch 51/200, Loss: 0.07279054287614094
0.7157842204983536
Epoch 61/200, Loss: 0.062013581602109805
0.7310815338358755
Epoch 71/200, Loss: 0.05728895103351937
0.7295327954817173
Epoch 81/200, Loss: 0.05197820383020573
0.7345575112771455
Epoch 91/200, Loss: 0.0498394180710117
0.7253967564339374
Epoch 101/200, Loss: 0.0469532392712103
0.7376310962024403
Epoch 111/200, Loss: 0.044888451488481626
0.7439739611042334
Epoch 121/200, Loss: 0.04354465732143985
0.7438613491583559
Epoch 131/200, Loss: 0.041211988052560225
0.7384386719701677
Epoch 141/200, Loss: 0.03997639553724892
0.7465239378139688
Epoch 151/200, Loss: 0.03827405397573279
0.744888492412184
Epoch 161/200, Loss: 0.03725378825846645
0.73991034379

[I 2024-01-21 09:12:54,791] Trial 68 finished with value: 0.7465239378139688 and parameters: {'hidden_dim_h': 19, 'dropout': 0.05219079493242375, 'batch_size': 280}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.7551505195127951
0.5125624986014669
Epoch 11/200, Loss: 0.24586821448158575
0.6255202692044765
Epoch 21/200, Loss: 0.1448861445124085
0.6455522085298002
Epoch 31/200, Loss: 0.13093622814159137
0.6590545092551214
Epoch 41/200, Loss: 0.12149319274199975
0.6675541775533399
Epoch 51/200, Loss: 0.11336466931813471
0.6762773055214093
Epoch 61/200, Loss: 0.10630327402739911
0.6869314975826948
Epoch 71/200, Loss: 0.09695611088662534
0.6940945955336016
Epoch 81/200, Loss: 0.08966572723678641
0.6920106207486582
Epoch 91/200, Loss: 0.08282874222542788
0.703040579371811
Epoch 101/200, Loss: 0.07660661959970319
0.7069648448736257
Epoch 111/200, Loss: 0.07153031199767783
0.7102638753572587
Epoch 121/200, Loss: 0.06798633198077614
0.716647348374135
Epoch 131/200, Loss: 0.06488805183687725
0.7202662813581032
Epoch 141/200, Loss: 0.0622607979017335
0.7216364714184373
Epoch 151/200, Loss: 0.06021943587709118
0.7245583891832967
Epoch 161/200, Loss: 0.05867438390851021
0.7317294302713

[I 2024-01-21 09:13:56,625] Trial 69 finished with value: 0.736874595384333 and parameters: {'hidden_dim_h': 23, 'dropout': 0.2983526326344915, 'batch_size': 543}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.5242454541511223
0.5623009512030686
Epoch 11/200, Loss: 0.19898179906313537
0.6364931202604599
Epoch 21/200, Loss: 0.1620108810116033
0.6603723599110931
Epoch 31/200, Loss: 0.12927184925704707
0.6701560891971646
Epoch 41/200, Loss: 0.10418149352562232
0.6786337440143739
Epoch 51/200, Loss: 0.0849092600286984
0.6704457790673406
Epoch 61/200, Loss: 0.07289787925413398
0.7125042779508755
Epoch 71/200, Loss: 0.06542089526526264
0.7170374962380225
Epoch 81/200, Loss: 0.05988832703623615
0.7255434184736095
Epoch 91/200, Loss: 0.055983902581158235
0.7224626246373237
Epoch 101/200, Loss: 0.05296543777966108
0.7244360079061613
Epoch 111/200, Loss: 0.05073223598912114
0.7271020377122163
Epoch 121/200, Loss: 0.04724516768435963
0.7264054890287073
Epoch 131/200, Loss: 0.046246163119546706
0.7273118968704385
Epoch 141/200, Loss: 0.04299926672314034
0.7356811466670061
Epoch 151/200, Loss: 0.04417646090026762
0.7318052961906126
Epoch 161/200, Loss: 0.04165269617663055
0.735531147

[I 2024-01-21 09:15:16,090] Trial 70 finished with value: 0.7356811466670061 and parameters: {'hidden_dim_h': 34, 'dropout': 0.10390883836673025, 'batch_size': 333}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.3399397873065688
0.5860997452117135
Epoch 11/200, Loss: 0.17883225191723218
0.6397140590365854
Epoch 21/200, Loss: 0.1480370004746047
0.652062658103155
Epoch 31/200, Loss: 0.12084990841421214
0.684067330827989
Epoch 41/200, Loss: 0.10139731080694632
0.6807029491717468
Epoch 51/200, Loss: 0.08574270575561306
0.6959958859567192
Epoch 61/200, Loss: 0.07484400103038008
0.7072475908339318
Epoch 71/200, Loss: 0.06836221333254468
0.7205486889993485
Epoch 81/200, Loss: 0.06306332637640563
0.7308921066503687
Epoch 91/200, Loss: 0.05882867095483975
0.7292807670313115
Epoch 101/200, Loss: 0.055904738351025364
0.7324061912290976
Epoch 111/200, Loss: 0.052248028784312985
0.7322676315382817
Epoch 121/200, Loss: 0.04991852390495213
0.7342438169505388
Epoch 131/200, Loss: 0.04734351790764115
0.7348296455598488
Epoch 141/200, Loss: 0.04535322475501082
0.7364755357481301
Epoch 151/200, Loss: 0.0431273952126503
0.7444922168050986
Epoch 161/200, Loss: 0.042077645998109474
0.7397533749

[I 2024-01-21 09:16:22,889] Trial 71 finished with value: 0.7444922168050986 and parameters: {'hidden_dim_h': 30, 'dropout': 0.1427380974855874, 'batch_size': 455}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.1833139592781663
0.5772565780147371
Epoch 11/200, Loss: 0.12893287395127118
0.6479597142384758
Epoch 21/200, Loss: 0.10743474191986024
0.6609419019497675
Epoch 31/200, Loss: 0.09462607256136835
0.6691731128540856
Epoch 41/200, Loss: 0.0856620033737272
0.6901319634853966
Epoch 51/200, Loss: 0.08145885658450425
0.6865831700338487
Epoch 61/200, Loss: 0.07535511977039278
0.7035019406859292
Epoch 71/200, Loss: 0.07135705929249525
0.7140693680283202
Epoch 81/200, Loss: 0.06677034462336451
0.7166663081627287
Epoch 91/200, Loss: 0.0639387967530638
0.7190005142852438
Epoch 101/200, Loss: 0.06168756273109466
0.7297673753983587
Epoch 111/200, Loss: 0.05910938698798418
0.7346640628588653
Epoch 121/200, Loss: 0.05736621737014502
0.7356202656610267
Epoch 131/200, Loss: 0.055014514829963446
0.7411311235595688
Epoch 141/200, Loss: 0.05386440479196608
0.7405660766110499
Epoch 151/200, Loss: 0.05245919956360012
0.7459469813192476
Epoch 161/200, Loss: 0.05045069090556353
0.7417530226

[I 2024-01-21 09:17:23,744] Trial 72 finished with value: 0.7465819127809102 and parameters: {'hidden_dim_h': 22, 'dropout': 0.21991782336172544, 'batch_size': 641}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.23947637373546385
0.580988695472888
Epoch 11/200, Loss: 0.16705995038995203
0.6420994840443397
Epoch 21/200, Loss: 0.1249090331905293
0.6632847619665718
Epoch 31/200, Loss: 0.09932154951230535
0.6822731823532958
Epoch 41/200, Loss: 0.0857054352198007
0.6979632345482036
Epoch 51/200, Loss: 0.07492306392710164
0.703609135832001
Epoch 61/200, Loss: 0.06882452824205723
0.7133644982933459
Epoch 71/200, Loss: 0.0642826701953726
0.7185900076402103
Epoch 81/200, Loss: 0.06062325940660711
0.72649583975624
Epoch 91/200, Loss: 0.056718370121604994
0.7286396715790223
Epoch 101/200, Loss: 0.053750295684022724
0.729311125294107
Epoch 111/200, Loss: 0.05149664083179438
0.7390129704121359
Epoch 121/200, Loss: 0.049314716865993896
0.7384207199494431
Epoch 131/200, Loss: 0.04695150143695327
0.7409743813128739
Epoch 141/200, Loss: 0.04675741788913619
0.7423866735655075
Epoch 151/200, Loss: 0.043667308213013525
0.7395454640045396
Epoch 161/200, Loss: 0.042734826159364775
0.74278186747

[I 2024-01-21 09:18:34,361] Trial 73 finished with value: 0.7461139296082162 and parameters: {'hidden_dim_h': 28, 'dropout': 0.11895330404887094, 'batch_size': 382}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.6382362297603061
0.5652493192721446
Epoch 11/200, Loss: 0.7610962390899658
0.6215165402565506
Epoch 21/200, Loss: 0.41093919702938625
0.6393321859018982
Epoch 31/200, Loss: 0.3004199666636331
0.6459306282180232
Epoch 41/200, Loss: 0.2662103784935815
0.6551722011912564
Epoch 51/200, Loss: 0.24435262296880994
0.6574759176904904
Epoch 61/200, Loss: 0.22284408126558578
0.6740470893592807
Epoch 71/200, Loss: 0.19928199265684401
0.6870131016363207
Epoch 81/200, Loss: 0.17463819427149638
0.6978910607484808
Epoch 91/200, Loss: 0.1507884736571993
0.7112626045487415
Epoch 101/200, Loss: 0.1281252750328609
0.7208981754366628
Epoch 111/200, Loss: 0.10722086259296962
0.7194380568745569
Epoch 121/200, Loss: 0.09019478814942496
0.7318386050510387
Epoch 131/200, Loss: 0.07488745450973511
0.7451212985520108
Epoch 141/200, Loss: 0.06353675701788493
0.7438086249937513
Epoch 151/200, Loss: 0.05438042421426092
0.7450837325496211
Epoch 161/200, Loss: 0.04794466442295483
0.74766000962669

[I 2024-01-21 09:19:37,560] Trial 74 finished with value: 0.7523493637120173 and parameters: {'hidden_dim_h': 26, 'dropout': 0.12812810152359738, 'batch_size': 578}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.6093775394715761
0.5329786445762594
Epoch 11/200, Loss: 0.23157600078143573
0.6244566710469337
Epoch 21/200, Loss: 0.18176378505794624
0.6409988118253006
Epoch 31/200, Loss: 0.16199951344414762
0.6623636075751582
Epoch 41/200, Loss: 0.14104184175008222
0.6761362410140221
Epoch 51/200, Loss: 0.12187700385325834
0.6947556045295168
Epoch 61/200, Loss: 0.10308381052393663
0.7030069358602354
Epoch 71/200, Loss: 0.08711231519517146
0.7037226622534073
Epoch 81/200, Loss: 0.0750123123197179
0.7239843399761379
Epoch 91/200, Loss: 0.06626594684233791
0.7289498795250587
Epoch 101/200, Loss: 0.06055361522655738
0.731026077065495
Epoch 111/200, Loss: 0.05591972495772337
0.7308250390887612
Epoch 121/200, Loss: 0.05281338154485351
0.74014659884991
Epoch 131/200, Loss: 0.050281598575805365
0.7320212595774481
Epoch 141/200, Loss: 0.04876273027376125
0.7343580629999297
Epoch 151/200, Loss: 0.046739241304366214
0.7439873022872676
Epoch 161/200, Loss: 0.045408171846678384
0.7389047744

[I 2024-01-21 09:20:38,664] Trial 75 finished with value: 0.7447486819973034 and parameters: {'hidden_dim_h': 20, 'dropout': 0.1299762924592914, 'batch_size': 528}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.28493397909662
0.5782194884595059
Epoch 11/200, Loss: 0.1905483457705249
0.6299157116519347
Epoch 21/200, Loss: 0.13641585733579553
0.656034513927051
Epoch 31/200, Loss: 0.10409652733284494
0.6837849815230757
Epoch 41/200, Loss: 0.08607747033238411
0.6906136676067078
Epoch 51/200, Loss: 0.0746380697287943
0.7109936725519052
Epoch 61/200, Loss: 0.06578973672636178
0.7170186955249365
Epoch 71/200, Loss: 0.059900544583797455
0.7239632331823256
Epoch 81/200, Loss: 0.05657722971037678
0.7313708821523377
Epoch 91/200, Loss: 0.052080499737159065
0.7398448673134891
Epoch 101/200, Loss: 0.04904358607271443
0.7335457809694278
Epoch 111/200, Loss: 0.04662798693322617
0.7458543854310422
Epoch 121/200, Loss: 0.04439261968693008
0.7382398093586698
Epoch 131/200, Loss: 0.04357297467472761
0.7360743989616674
Epoch 141/200, Loss: 0.041360777924242226
0.7409183734079456
Epoch 151/200, Loss: 0.04009696339135584
0.7391300659867862
Epoch 161/200, Loss: 0.03789355945975884
0.74514295030

[I 2024-01-21 09:21:46,262] Trial 76 finished with value: 0.7474847642785023 and parameters: {'hidden_dim_h': 28, 'dropout': 0.10829963554179342, 'batch_size': 438}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.3096300246460097
0.5852739643732082
Epoch 11/200, Loss: 0.11785217303605307
0.642285916660854
Epoch 21/200, Loss: 0.10699626963053431
0.6636276205990258
Epoch 31/200, Loss: 0.09651976202925046
0.688101178262426
Epoch 41/200, Loss: 0.08650981439721017
0.699159162268154
Epoch 51/200, Loss: 0.0763098726137763
0.7127722230322107
Epoch 61/200, Loss: 0.06709418703048002
0.7196027550527836
Epoch 71/200, Loss: 0.05987813918008691
0.7296880510907896
Epoch 81/200, Loss: 0.054315866281588875
0.7338041497191234
Epoch 91/200, Loss: 0.049523002335003445
0.7268280318506041
Epoch 101/200, Loss: 0.04719585774555093
0.7393644066547019
Epoch 111/200, Loss: 0.04385422737825485
0.7374034255509448
Epoch 121/200, Loss: 0.04141787226711001
0.7343146463259551
Epoch 131/200, Loss: 0.0386549091587464
0.7380866548831461
Epoch 141/200, Loss: 0.0373080244642638
0.7427328972636403
Epoch 151/200, Loss: 0.035972160508944875
0.7364251863839675
Epoch 161/200, Loss: 0.03469981807505801
0.743968199200

[I 2024-01-21 09:22:52,480] Trial 77 finished with value: 0.7439681992006966 and parameters: {'hidden_dim_h': 26, 'dropout': 0.06720988801759274, 'batch_size': 482}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.2691801854542324
0.47920211670823304
Epoch 11/200, Loss: 0.4750266288008009
0.6274791409443321
Epoch 21/200, Loss: 0.18636306950024195
0.6498378215515794
Epoch 31/200, Loss: 0.10855182792459216
0.6808216487095884
Epoch 41/200, Loss: 0.08983669770615442
0.7045820938822722
Epoch 51/200, Loss: 0.08366184724228723
0.700590325940661
Epoch 61/200, Loss: 0.07822598900113786
0.7158480847622513
Epoch 71/200, Loss: 0.0722920940390655
0.7232440314430021
Epoch 81/200, Loss: 0.06661463975906372
0.7250848725462733
Epoch 91/200, Loss: 0.06115577487008912
0.732244069630676
Epoch 101/200, Loss: 0.05605459607073239
0.7372674562624207
Epoch 111/200, Loss: 0.05146091527172497
0.7340370240403887
Epoch 121/200, Loss: 0.0472564405628613
0.7389889878920279
Epoch 131/200, Loss: 0.04343833423086575
0.7439295568153528
Epoch 141/200, Loss: 0.040792370587587355
0.7500217767913614
Epoch 151/200, Loss: 0.03833792539579528
0.7435321773961009
Epoch 161/200, Loss: 0.037009281771523614
0.74078199110

[I 2024-01-21 09:23:57,777] Trial 78 finished with value: 0.7500217767913614 and parameters: {'hidden_dim_h': 32, 'dropout': 0.09404277666853741, 'batch_size': 574}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.6884401768445969
0.5539146246649312
Epoch 11/200, Loss: 0.3580713853240013
0.6013670395880915
Epoch 21/200, Loss: 0.23333344757556915
0.6388379596000877
Epoch 31/200, Loss: 0.19063502475619315
0.6476302142076742
Epoch 41/200, Loss: 0.17596958056092263
0.6594884251936478
Epoch 51/200, Loss: 0.16509175822138786
0.6658567406603306
Epoch 61/200, Loss: 0.1558895505964756
0.6735140886960561
Epoch 71/200, Loss: 0.14472882077097893
0.6870915202887723
Epoch 81/200, Loss: 0.1338477037847042
0.6986489867152824
Epoch 91/200, Loss: 0.12337082289159298
0.7007305329488396
Epoch 101/200, Loss: 0.11271945387125015
0.7080724611440402
Epoch 111/200, Loss: 0.10400142408907413
0.7154699315906125
Epoch 121/200, Loss: 0.09434870779514312
0.7182282691257286
Epoch 131/200, Loss: 0.08693251870572567
0.7189873870612462
Epoch 141/200, Loss: 0.08045541569590568
0.7296424461248406
Epoch 151/200, Loss: 0.0742914192378521
0.7273631103758135
Epoch 161/200, Loss: 0.06863821726292371
0.7314127261091

[I 2024-01-21 09:24:53,716] Trial 79 finished with value: 0.7387202958040895 and parameters: {'hidden_dim_h': 18, 'dropout': 0.14036219367621855, 'batch_size': 1040}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.20578275714069605
0.5872963132071173
Epoch 11/200, Loss: 0.12746653938665986
0.6435703376579464
Epoch 21/200, Loss: 0.10325072954098384
0.661722053576087
Epoch 31/200, Loss: 0.0862683819917341
0.7008154682419142
Epoch 41/200, Loss: 0.07455698711176713
0.7068868945376802
Epoch 51/200, Loss: 0.06678180722519755
0.7183589178337194
Epoch 61/200, Loss: 0.059797210696463786
0.7236766007140247
Epoch 71/200, Loss: 0.05523622392987212
0.7389960195463773
Epoch 81/200, Loss: 0.05086088653964301
0.7443218146346231
Epoch 91/200, Loss: 0.04885324579663575
0.7396379631266268
Epoch 101/200, Loss: 0.0459100732114166
0.750840703698382
Epoch 111/200, Loss: 0.04411775525659323
0.7515825400958842
Epoch 121/200, Loss: 0.04234974808059633
0.7454200810226713
Epoch 131/200, Loss: 0.039706163108348846
0.7513694439403721
Epoch 141/200, Loss: 0.038577546598389745
0.7494611572337072
Epoch 151/200, Loss: 0.03705688511642317
0.748119662017265
Epoch 161/200, Loss: 0.036115674573617675
0.749334265

[I 2024-01-21 09:25:58,635] Trial 80 finished with value: 0.7515825400958842 and parameters: {'hidden_dim_h': 23, 'dropout': 0.07981418029090079, 'batch_size': 422}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.8384118917140555
0.5654154551360353
Epoch 11/200, Loss: 0.21875383467116255
0.6355226995076853
Epoch 21/200, Loss: 0.13412943656774276
0.6654459957231921
Epoch 31/200, Loss: 0.11966536035563083
0.6954073844182512
Epoch 41/200, Loss: 0.10633401620261212
0.702590511397333
Epoch 51/200, Loss: 0.09328621483229577
0.7126267021758782
Epoch 61/200, Loss: 0.08061391226154693
0.7216555504316147
Epoch 71/200, Loss: 0.07008396588424419
0.7345664984836479
Epoch 81/200, Loss: 0.06227537450638223
0.7363564538021982
Epoch 91/200, Loss: 0.054471726588746334
0.7431438852514882
Epoch 101/200, Loss: 0.049143171690879985
0.7369503292267514
Epoch 111/200, Loss: 0.046953977818818805
0.7411670736114407
Epoch 121/200, Loss: 0.04326189127057157
0.7398588988913185
Epoch 131/200, Loss: 0.04178407431599942
0.7386993306593452
Epoch 141/200, Loss: 0.040368028936233924
0.7414496914957919
Epoch 151/200, Loss: 0.03872947917973742
0.7451928781786558
Epoch 161/200, Loss: 0.0372960460471346
0.7481160

[I 2024-01-21 09:27:02,033] Trial 81 finished with value: 0.7481160343035803 and parameters: {'hidden_dim_h': 21, 'dropout': 0.07343303479412333, 'batch_size': 430}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 2.902523994445801
0.5130408875830554
Epoch 11/200, Loss: 1.1733664904000625
0.611391792056526
Epoch 21/200, Loss: 0.45758485962759776
0.003720523225210285
Epoch 31/200, Loss: 0.2834796278544192
0.013987903382114537
Epoch 41/200, Loss: 0.2586782822069132
0.005279381549203553
Epoch 51/200, Loss: 0.25821468205946796
0.014190466608706546
Epoch 61/200, Loss: 0.25532528195741044
0.010296962720857795
Epoch 71/200, Loss: 0.25380742268742257
0.018569698042397515
Epoch 81/200, Loss: 0.2546064555644989
0.03365248398833208
Epoch 91/200, Loss: 0.25789084665055545
0.023210283504527314
Epoch 101/200, Loss: 0.25263525376904683
0.06700083274992297
Epoch 111/200, Loss: 0.25252364941363065
0.05405145920181266
Epoch 121/200, Loss: 0.2530775044886571
0.03433364026841457
Epoch 131/200, Loss: 0.25229882491084765
0.04608032924794866
Epoch 141/200, Loss: 0.25084121609633825
0.054735066446809505
Epoch 151/200, Loss: 0.25373116979059185
0.02517359359055837
Epoch 161/200, Loss: 0.25272840992459

[I 2024-01-21 09:28:13,198] Trial 82 finished with value: 0.611391792056526 and parameters: {'hidden_dim_h': 30, 'dropout': 0.07698899291326304, 'batch_size': 380}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.2620632590317145
0.5396455174376377
Epoch 11/200, Loss: 0.40976093164304406
0.6315645521789996
Epoch 21/200, Loss: 0.15983587830531887
0.6692917063591401
Epoch 31/200, Loss: 0.11154558891203345
0.6819334187469814
Epoch 41/200, Loss: 0.09940455817594761
0.6964441928893119
Epoch 51/200, Loss: 0.09206769324657393
0.7107297170152134
Epoch 61/200, Loss: 0.08268801686240405
0.7296938570357563
Epoch 71/200, Loss: 0.07402629986768816
0.7315222155377745
Epoch 81/200, Loss: 0.06738450723450358
0.7381115148695495
Epoch 91/200, Loss: 0.06082791126355892
0.7308283771912985
Epoch 101/200, Loss: 0.05322196434547261
0.7485321611119449
Epoch 111/200, Loss: 0.04807256480179182
0.7392622705150007
Epoch 121/200, Loss: 0.0436549063135938
0.7374452486686518
Epoch 131/200, Loss: 0.04036902463654193
0.7333023523309821
Epoch 141/200, Loss: 0.037699597637827806
0.73448117787399
Epoch 151/200, Loss: 0.036364027776005795
0.7413817928445599
Epoch 161/200, Loss: 0.0349286496184948
0.73458319879

[I 2024-01-21 09:29:16,513] Trial 83 finished with value: 0.7485321611119449 and parameters: {'hidden_dim_h': 23, 'dropout': 0.06234519180907491, 'batch_size': 496}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.3153963200747967
0.5868415740623415
Epoch 11/200, Loss: 0.15423012574513753
0.6502722648621589
Epoch 21/200, Loss: 0.12171856611967087
0.6717997011037478
Epoch 31/200, Loss: 0.09640058676401773
0.6923015276400983
Epoch 41/200, Loss: 0.08169637632866701
0.7047874544730925
Epoch 51/200, Loss: 0.07325992559393248
0.7128620785799139
Epoch 61/200, Loss: 0.06628251671791077
0.7266957686242957
Epoch 71/200, Loss: 0.06065357010811567
0.7323393778186987
Epoch 81/200, Loss: 0.05700496416538954
0.7311852170139593
Epoch 91/200, Loss: 0.053378988554080326
0.7323084692218895
Epoch 101/200, Loss: 0.050637462610999745
0.7304446236651146
Epoch 111/200, Loss: 0.04733234761903683
0.7413459161519182
Epoch 121/200, Loss: 0.04600001716365417
0.7409956675920674
Epoch 131/200, Loss: 0.04500018426527579
0.7422255909534046
Epoch 141/200, Loss: 0.042588153419395286
0.7475026410556648
Epoch 151/200, Loss: 0.04153771226604779
0.7482755159744499
Epoch 161/200, Loss: 0.04010408104707797
0.738677

[I 2024-01-21 09:30:27,818] Trial 84 finished with value: 0.7482755159744499 and parameters: {'hidden_dim_h': 24, 'dropout': 0.09907268987973639, 'batch_size': 334}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.2926653067068178
0.5764347847978752
Epoch 11/200, Loss: 0.18468031348014363
0.6436341128170336
Epoch 21/200, Loss: 0.13848292538706136
0.6576319606480115
Epoch 31/200, Loss: 0.10766201466321945
0.6724353336234029
Epoch 41/200, Loss: 0.0897500032977182
0.6853820946040361
Epoch 51/200, Loss: 0.07977243163147751
0.703516023417272
Epoch 61/200, Loss: 0.07227879504160005
0.7127666076659045
Epoch 71/200, Loss: 0.0667166145024251
0.7249696108940238
Epoch 81/200, Loss: 0.06287197411364438
0.728350438753508
Epoch 91/200, Loss: 0.061234360826866965
0.7317787560619583
Epoch 101/200, Loss: 0.057644009286043595
0.7365059039963748
Epoch 111/200, Loss: 0.05584234478218215
0.7396942688719673
Epoch 121/200, Loss: 0.05401526855266824
0.7391937834495019
Epoch 131/200, Loss: 0.051207896017906616
0.7386160902894864
Epoch 141/200, Loss: 0.05018842410372228
0.7361764413415656
Epoch 151/200, Loss: 0.048713547614764194
0.7395789322549385
Epoch 161/200, Loss: 0.048001980218960315
0.74388497

[I 2024-01-21 09:31:32,697] Trial 85 finished with value: 0.7438849743907209 and parameters: {'hidden_dim_h': 20, 'dropout': 0.12823883412396633, 'batch_size': 415}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.44558097008201814
0.5819013899887273
Epoch 11/200, Loss: 0.1543059539463785
0.6594650096387016
Epoch 21/200, Loss: 0.12488607813914616
0.6567744027034875
Epoch 31/200, Loss: 0.11265493598249224
0.6943288351582553
Epoch 41/200, Loss: 0.10114029049873352
0.7130577951809236
Epoch 51/200, Loss: 0.08970603326128589
0.7161218760740757
Epoch 61/200, Loss: 0.07864969430698289
0.721197905957654
Epoch 71/200, Loss: 0.06984337088134554
0.7278373483544933
Epoch 81/200, Loss: 0.06122635998245743
0.7366407746726183
Epoch 91/200, Loss: 0.05472955480217934
0.7385488019090818
Epoch 101/200, Loss: 0.049892921207679644
0.7430415705479505
Epoch 111/200, Loss: 0.046690486268036895
0.7418800354183228
Epoch 121/200, Loss: 0.04393845620668597
0.7424794610903047
Epoch 131/200, Loss: 0.04084745577226082
0.7451848942406629
Epoch 141/200, Loss: 0.04006479225224919
0.7473497689229569
Epoch 151/200, Loss: 0.038193388428125113
0.7404945629471962
Epoch 161/200, Loss: 0.037086643589039646
0.744401

[I 2024-01-21 09:32:36,262] Trial 86 finished with value: 0.7510170385623135 and parameters: {'hidden_dim_h': 26, 'dropout': 0.1147183620624167, 'batch_size': 557}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.4195669970729135
0.43102717879035807
Epoch 11/200, Loss: 0.47832265157591214
0.6134610620385308
Epoch 21/200, Loss: 0.2032714547081427
0.6475336237745176
Epoch 31/200, Loss: 0.15489377098327334
0.6583261234933455
Epoch 41/200, Loss: 0.14222999221899293
0.6760063744718292
Epoch 51/200, Loss: 0.131316811862317
0.68532230088482
Epoch 61/200, Loss: 0.1176282846453515
0.6944649156026619
Epoch 71/200, Loss: 0.10580443523146889
0.7034402654506843
Epoch 81/200, Loss: 0.09314527650448409
0.7145751837691598
Epoch 91/200, Loss: 0.08277846974405376
0.7071204993425599
Epoch 101/200, Loss: 0.07454941811209376
0.7162725269640677
Epoch 111/200, Loss: 0.06596770027483051
0.7284238047319478
Epoch 121/200, Loss: 0.06060377779332074
0.730196895146645
Epoch 131/200, Loss: 0.05799417722631584
0.731474147385489
Epoch 141/200, Loss: 0.054157536646181885
0.7395504542703435
Epoch 151/200, Loss: 0.05172107182443142
0.7385212275834436
Epoch 161/200, Loss: 0.05118782039393078
0.745851249427934

[I 2024-01-21 09:33:39,784] Trial 87 finished with value: 0.7458512494279343 and parameters: {'hidden_dim_h': 17, 'dropout': 0.08186748513564969, 'batch_size': 463}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.20789949091918328
0.5861285990268988
Epoch 11/200, Loss: 0.13249074667692184
0.6489030515653801
Epoch 21/200, Loss: 0.10045061435769587
0.6597805498374778
Epoch 31/200, Loss: 0.08631161074427997
0.6854599657619684
Epoch 41/200, Loss: 0.0793707673163975
0.6945967204581829
Epoch 51/200, Loss: 0.07455428996506859
0.7041667465833883
Epoch 61/200, Loss: 0.07051832316552892
0.7175368519703175
Epoch 71/200, Loss: 0.06783216189154807
0.7242293256222946
Epoch 81/200, Loss: 0.0657289840061875
0.7217779366267112
Epoch 91/200, Loss: 0.0613349733655067
0.7236503349003677
Epoch 101/200, Loss: 0.05895961240372237
0.7306060411575497
Epoch 111/200, Loss: 0.05858518835157156
0.7363199871491108
Epoch 121/200, Loss: 0.05527766120127019
0.7402425251642283
Epoch 131/200, Loss: 0.05379937506993027
0.7358143655515443
Epoch 141/200, Loss: 0.05217802102732308
0.739538852670307
Epoch 151/200, Loss: 0.050694845726384836
0.7342511483877384
Epoch 161/200, Loss: 0.048826103865662045
0.7472826690

[I 2024-01-21 09:34:53,810] Trial 88 finished with value: 0.7472826690687755 and parameters: {'hidden_dim_h': 22, 'dropout': 0.17353334976510626, 'batch_size': 297}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.6449359961045094
0.5621032123025507
Epoch 11/200, Loss: 0.17056032289297152
0.6413284543606292
Epoch 21/200, Loss: 0.09953029434650372
0.6486977051231265
Epoch 31/200, Loss: 0.0909985982072659
0.6890190748640658
Epoch 41/200, Loss: 0.08488913300709847
0.6969979644881186
Epoch 51/200, Loss: 0.07869272755506711
0.7002187795332689
Epoch 61/200, Loss: 0.07366443692873685
0.7120371902201695
Epoch 71/200, Loss: 0.06789201469375537
0.7222023742177776
Epoch 81/200, Loss: 0.06244793916359926
0.7247219030855858
Epoch 91/200, Loss: 0.05843647349721346
0.7365000087061107
Epoch 101/200, Loss: 0.054137616872023314
0.7379240416221904
Epoch 111/200, Loss: 0.051309409814003185
0.7368200299114346
Epoch 121/200, Loss: 0.04622275831225591
0.7367417388825604
Epoch 131/200, Loss: 0.04409571488698324
0.7446777943285711
Epoch 141/200, Loss: 0.04099694247811268
0.7360699745634353
Epoch 151/200, Loss: 0.0392956867431983
0.7397487964700569
Epoch 161/200, Loss: 0.037340908573988155
0.74202344

[I 2024-01-21 09:36:04,795] Trial 89 finished with value: 0.7446777943285711 and parameters: {'hidden_dim_h': 33, 'dropout': 0.08896925659397037, 'batch_size': 518}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.22927558649988736
0.5763162233655901
Epoch 11/200, Loss: 0.14136170516995822
0.6441959968854581
Epoch 21/200, Loss: 0.10136776461320765
0.6696159365962175
Epoch 31/200, Loss: 0.08326249552123687
0.6870181645278457
Epoch 41/200, Loss: 0.07518332061522147
0.7072027571117032
Epoch 51/200, Loss: 0.07244601907098995
0.714619716560184
Epoch 61/200, Loss: 0.06748776413938579
0.7187627881849883
Epoch 71/200, Loss: 0.06544102649478352
0.7284127132328522
Epoch 81/200, Loss: 0.06261286069365109
0.7145003815872285
Epoch 91/200, Loss: 0.059493025611428656
0.7341452894750108
Epoch 101/200, Loss: 0.05683313086628914
0.7369923727001246
Epoch 111/200, Loss: 0.05425142921945628
0.7375566040235326
Epoch 121/200, Loss: 0.051886490732431415
0.7300548351942968
Epoch 131/200, Loss: 0.05022377972217167
0.740467999012206
Epoch 141/200, Loss: 0.049701784244355035
0.7398779383695316
Epoch 151/200, Loss: 0.04663076970507117
0.7387319298072577
Epoch 161/200, Loss: 0.04566143396146157
0.7413191

[I 2024-01-21 09:37:30,385] Trial 90 finished with value: 0.7456549280304957 and parameters: {'hidden_dim_h': 29, 'dropout': 0.11561078097648611, 'batch_size': 236}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.39246549570199213
0.5678178894483947
Epoch 11/200, Loss: 0.16800908202474768
0.6453554599529061
Epoch 21/200, Loss: 0.14495642844474677
0.6604726944167613
Epoch 31/200, Loss: 0.13252057925318228
0.6621497932871324
Epoch 41/200, Loss: 0.12022492605628389
0.6789010643126907
Epoch 51/200, Loss: 0.10669653704672148
0.6843491730714879
Epoch 61/200, Loss: 0.09583489687153787
0.7007284906251423
Epoch 71/200, Loss: 0.0844832927440152
0.7109325716306463
Epoch 81/200, Loss: 0.07482805622346474
0.7187133635289507
Epoch 91/200, Loss: 0.06759395337466037
0.7243682464929626
Epoch 101/200, Loss: 0.06208912023540699
0.7348715772139456
Epoch 111/200, Loss: 0.05729492268327511
0.7379118022288274
Epoch 121/200, Loss: 0.053906229635079704
0.7444647921288682
Epoch 131/200, Loss: 0.050870566769982827
0.742837515159387
Epoch 141/200, Loss: 0.048727698624134064
0.737513833503062
Epoch 151/200, Loss: 0.04658832705833695
0.7443684716606761
Epoch 161/200, Loss: 0.04526713095379598
0.74244858

[I 2024-01-21 09:38:31,243] Trial 91 finished with value: 0.7456677977123034 and parameters: {'hidden_dim_h': 24, 'dropout': 0.15648815681795408, 'batch_size': 609}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 1.0725148439407348
0.5686821003947419
Epoch 11/200, Loss: 0.5246235847473144
0.6145335653302737
Epoch 21/200, Loss: 0.33403615256150565
0.64370285217469
Epoch 31/200, Loss: 0.27962505221366885
0.6522289674232088
Epoch 41/200, Loss: 0.2547788063685099
0.6554209214034092
Epoch 51/200, Loss: 0.23269511063893636
0.6579227980053733
Epoch 61/200, Loss: 0.21007493486007053
0.6611302676407547
Epoch 71/200, Loss: 0.18630673438310624
0.6832294512460082
Epoch 81/200, Loss: 0.16277302503585817
0.6987040284823289
Epoch 91/200, Loss: 0.13960522810618084
0.7138819324067464
Epoch 101/200, Loss: 0.1186033084988594
0.72481156615923
Epoch 111/200, Loss: 0.0997815969089667
0.7239601990866106
Epoch 121/200, Loss: 0.0841724211970965
0.7330391919463162
Epoch 131/200, Loss: 0.07134450636804104
0.7341775135473319
Epoch 141/200, Loss: 0.06062750791509946
0.7405881618797087
Epoch 151/200, Loss: 0.05235224093000094
0.73941489706334
Epoch 161/200, Loss: 0.046747863416870435
0.7384427649765177
Ep

[I 2024-01-21 09:39:33,135] Trial 92 finished with value: 0.7421321839927312 and parameters: {'hidden_dim_h': 27, 'dropout': 0.1065802124977205, 'batch_size': 676}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.21377341007744824
0.5690029171063804
Epoch 11/200, Loss: 0.15351224221565105
0.6372645150064978
Epoch 21/200, Loss: 0.12688758582980544
0.6560333250681579
Epoch 31/200, Loss: 0.10700085345241758
0.6760442558295563
Epoch 41/200, Loss: 0.09280739669446592
0.6864373262719299
Epoch 51/200, Loss: 0.08143722873043131
0.6961641487551167
Epoch 61/200, Loss: 0.07237976099605914
0.7085951154084669
Epoch 71/200, Loss: 0.06651496197338458
0.7227029145915824
Epoch 81/200, Loss: 0.061542361698768755
0.7301193241101436
Epoch 91/200, Loss: 0.05764869159018552
0.7345153576027977
Epoch 101/200, Loss: 0.05476048947484405
0.7410451576753969
Epoch 111/200, Loss: 0.05188048548168606
0.7457707060076576
Epoch 121/200, Loss: 0.04945198087780564
0.7432314602885817
Epoch 131/200, Loss: 0.04751801463188948
0.7509601585882424
Epoch 141/200, Loss: 0.04553047277861171
0.7447098700924811
Epoch 151/200, Loss: 0.044709283858537674
0.7458090098570119
Epoch 161/200, Loss: 0.04308580234646797
0.744711

[I 2024-01-21 09:40:34,424] Trial 93 finished with value: 0.7509601585882424 and parameters: {'hidden_dim_h': 25, 'dropout': 0.14618092765402113, 'batch_size': 749}. Best is trial 16 with value: 0.756164132510553.


Epoch 1/200, Loss: 0.35690698671985316
0.5736486739723867
Epoch 11/200, Loss: 0.16846696669990952
0.6385152386451346
Epoch 21/200, Loss: 0.14635466321094617
0.6620666400976782
Epoch 31/200, Loss: 0.12558479989702637
0.6763926530463882
Epoch 41/200, Loss: 0.10601131638159624
0.6947417786484885
Epoch 51/200, Loss: 0.08958295853556814
0.7087895125367119
Epoch 61/200, Loss: 0.07720493827317212
0.7202316300185533
Epoch 71/200, Loss: 0.0672347716785766
0.7269314663766655
Epoch 81/200, Loss: 0.06069777714642319
0.7369593160662032
Epoch 91/200, Loss: 0.05672605738446519
0.7385445016652255
Epoch 101/200, Loss: 0.05344417650957365
0.746279777636979
Epoch 111/200, Loss: 0.05017506502367355
0.7445352402267276
Epoch 121/200, Loss: 0.04755093489547033
0.7433452143565749
Epoch 131/200, Loss: 0.04656523868844316
0.7488521244926197
Epoch 141/200, Loss: 0.044605338694276034
0.7484687163514611
Epoch 151/200, Loss: 0.04307461640722043
0.7601027427382819
Epoch 161/200, Loss: 0.04093383071390358
0.755798950

[I 2024-01-21 09:41:36,215] Trial 94 finished with value: 0.7601027427382819 and parameters: {'hidden_dim_h': 23, 'dropout': 0.12805161023112027, 'batch_size': 544}. Best is trial 94 with value: 0.7601027427382819.


Epoch 1/200, Loss: 0.45105262100696564
0.5688187611956164
Epoch 11/200, Loss: 0.1769403355817
0.6413105219903749
Epoch 21/200, Loss: 0.14903147725595367
0.6527351335010704
Epoch 31/200, Loss: 0.1346060254921516
0.6720967901421641
Epoch 41/200, Loss: 0.12062716421981652
0.6851479810455221
Epoch 51/200, Loss: 0.10650839946336216
0.6917578110653747
Epoch 61/200, Loss: 0.09382359310984612
0.6990155358355952
Epoch 71/200, Loss: 0.0814476464357641
0.7203466011155126
Epoch 81/200, Loss: 0.07103395606908533
0.7311895179978017
Epoch 91/200, Loss: 0.06375176242242257
0.7314641805990727
Epoch 101/200, Loss: 0.05741430912166834
0.7350358918829463
Epoch 111/200, Loss: 0.05366281378600332
0.7449959778390723
Epoch 121/200, Loss: 0.05013234137247006
0.742096363826742
Epoch 131/200, Loss: 0.047892188653349876
0.7470489711356207
Epoch 141/200, Loss: 0.04563117720600632
0.7449111899073907
Epoch 151/200, Loss: 0.04449526241256131
0.7488551790476378
Epoch 161/200, Loss: 0.04216430149972439
0.74956251241020

[I 2024-01-21 09:42:37,559] Trial 95 finished with value: 0.750328764353553 and parameters: {'hidden_dim_h': 23, 'dropout': 0.13484093657115964, 'batch_size': 562}. Best is trial 94 with value: 0.7601027427382819.


Epoch 1/200, Loss: 2.1216597778852595
0.5021378562087597
Epoch 11/200, Loss: 0.9183065419973329
0.6100411226388197
Epoch 21/200, Loss: 0.4162579573864161
0.6140882033130955
Epoch 31/200, Loss: 0.21885129220263902
0.6468219950269284
Epoch 41/200, Loss: 0.17806362343388935
0.6672985333844116
Epoch 51/200, Loss: 0.16362369025862494
0.6656103061278188
Epoch 61/200, Loss: 0.14912607018337692
0.6857794203763704
Epoch 71/200, Loss: 0.13468025659405908
0.6936491034143133
Epoch 81/200, Loss: 0.1195740930216257
0.7004517210410286
Epoch 91/200, Loss: 0.10539201820312544
0.7131758302497293
Epoch 101/200, Loss: 0.0924223805236262
0.7207161650158443
Epoch 111/200, Loss: 0.08003319297419038
0.7257982143348092
Epoch 121/200, Loss: 0.07097547128796577
0.7250417578927918
Epoch 131/200, Loss: 0.06357779301876246
0.7347092688805306
Epoch 141/200, Loss: 0.058992491818444674
0.7386087175714734
Epoch 151/200, Loss: 0.054330582795448085
0.7377938212575071
Epoch 161/200, Loss: 0.05190019474126572
0.73840228298

[I 2024-01-21 09:43:41,923] Trial 96 finished with value: 0.7451805437531918 and parameters: {'hidden_dim_h': 22, 'dropout': 0.13053774607361757, 'batch_size': 469}. Best is trial 94 with value: 0.7601027427382819.


Epoch 1/200, Loss: 1.4858059883117676
0.49897810038177065
Epoch 11/200, Loss: 0.76514918381168
0.6179514010660934
Epoch 21/200, Loss: 0.4015328663010751
0.14140440073983537
Epoch 31/200, Loss: 0.24243649215467514
0.5469957509639235
Epoch 41/200, Loss: 0.18314536540739
0.6355113883526874
Epoch 51/200, Loss: 0.16651474708510983
0.6633069399104481
Epoch 61/200, Loss: 0.15595105626890737
0.6746183628329994
Epoch 71/200, Loss: 0.14580663606043784
0.681122248582155
Epoch 81/200, Loss: 0.13632823622995807
0.6765822065295138
Epoch 91/200, Loss: 0.12470972730267432
0.6870828247847636
Epoch 101/200, Loss: 0.11644867399046498
0.6920893940270652
Epoch 111/200, Loss: 0.10535674974803001
0.7087768750366416
Epoch 121/200, Loss: 0.09642582819346458
0.7099094787089691
Epoch 131/200, Loss: 0.08790857825548418
0.7165912849771403
Epoch 141/200, Loss: 0.08135470002889633
0.7192176330704207
Epoch 151/200, Loss: 0.07543919139331387
0.7189474113736266
Epoch 161/200, Loss: 0.07067239212412987
0.726244735411795

[I 2024-01-21 09:44:45,178] Trial 97 finished with value: 0.7383678544820484 and parameters: {'hidden_dim_h': 31, 'dropout': 0.09862615159881767, 'batch_size': 648}. Best is trial 94 with value: 0.7601027427382819.


Epoch 1/200, Loss: 0.35071899235248566
0.5812017684641576
Epoch 11/200, Loss: 0.22619321703910827
0.6228007593133374
Epoch 21/200, Loss: 0.16383529156446458
0.6572353776686054
Epoch 31/200, Loss: 0.12302219972014428
0.6640518191240349
Epoch 41/200, Loss: 0.09750863537192345
0.6949577000631573
Epoch 51/200, Loss: 0.08314053401350975
0.7041634039480514
Epoch 61/200, Loss: 0.07432890348136426
0.7134006063701935
Epoch 71/200, Loss: 0.06951108299195767
0.7149471186966948
Epoch 81/200, Loss: 0.06596597515046597
0.7201006716251644
Epoch 91/200, Loss: 0.06329051606357097
0.728018050939979
Epoch 101/200, Loss: 0.059821832552552225
0.7297250524256933
Epoch 111/200, Loss: 0.057527995109558104
0.7317140726661504
Epoch 121/200, Loss: 0.056098053604364394
0.7394815501090354
Epoch 131/200, Loss: 0.054343602061271666
0.7378551362532113
Epoch 141/200, Loss: 0.05170028321444988
0.7426218535197361
Epoch 151/200, Loss: 0.050481738969683644
0.7476591958720332
Epoch 161/200, Loss: 0.048639259710907934
0.741

[I 2024-01-21 09:45:49,984] Trial 98 finished with value: 0.7476591958720332 and parameters: {'hidden_dim_h': 20, 'dropout': 0.1486104359338494, 'batch_size': 405}. Best is trial 94 with value: 0.7601027427382819.


Epoch 1/200, Loss: 4.040617409505342
0.46312266136690955
Epoch 11/200, Loss: 2.254516030612745
0.5276403248107603
Epoch 21/200, Loss: 1.2205898542153208
0.5686745010112969
Epoch 31/200, Loss: 0.6770377441456443
0.6176333184646121
Epoch 41/200, Loss: 0.41000850969239283
0.3258662037317496
Epoch 51/200, Loss: 0.2437906586810162
0.6256608623314219
Epoch 61/200, Loss: 0.19601949265128688
0.638590875211637
Epoch 71/200, Loss: 0.17945631475825058
0.6475425351050966
Epoch 81/200, Loss: 0.16857773418489255
0.6588517310245882
Epoch 91/200, Loss: 0.15846163152079834
0.6634623910602645
Epoch 101/200, Loss: 0.1463971863451757
0.6794718283487811
Epoch 111/200, Loss: 0.13390926448138138
0.6904614902049112
Epoch 121/200, Loss: 0.12181849032640457
0.688987199210248
Epoch 131/200, Loss: 0.10922741223322718
0.7073786301347038
Epoch 141/200, Loss: 0.09780918767577723
0.7072472260779789
Epoch 151/200, Loss: 0.0873923276207949
0.7232872469657333
Epoch 161/200, Loss: 0.07826442565572889
0.7245908080934816
E

[I 2024-01-21 09:46:50,476] Trial 99 finished with value: 0.7394443620941293 and parameters: {'hidden_dim_h': 18, 'dropout': 0.1657532538257177, 'batch_size': 531}. Best is trial 94 with value: 0.7601027427382819.


Best Trial:
  Value: 0.7601
  Params: 
    hidden_dim_h: 23
    dropout: 0.12805161023112027
    batch_size: 544


### 1 layers modified softmax

In [160]:
import optuna
from scipy.stats import pearsonr
learning_rate = 0.001
epochs = 200
num_heads = 4
num_layers = 1
sequence_length = L
input_dim = AA_size*L
output_dim = 1
dropout_init = 0.3
batch_size_init = 1000
hidden_dim_h_init = 32

def objective(trial):
    # Define the hyperparameters to be optimized
    # hidden_dim_h = trial.suggest_int('hidden_dim_h', hidden_dim_h_init, 10, 50)
    # dropout = trial.suggest_float('dropout', dropout_init, 0.05, 0.35)
    # batch_size = trial.suggest_int('batch_size', batch_size_init, 100, 1200)

    hidden_dim_h = trial.suggest_int('hidden_dim_h', 10, 50)
    dropout = trial.suggest_float('dropout', 0.05, 0.35)
    batch_size = trial.suggest_int('batch_size', 100, 1200)
    
    model = Transformer_torch_MHA(input_dim, hidden_dim_h*num_heads, num_layers, num_heads, dropout).to(device)
    
    train_loader = data.DataLoader(train_dataset,
                                   batch_size=batch_size,
                                   shuffle=True,
                                   drop_last=False)
    criterion = nn.MSELoss()
    optimizer = optim.Adam(model.parameters(), lr=learning_rate)

    r2_test = []
    try: 
        for epoch in range(epochs):

                model.train()
                total_loss = 0
                for batch_inputs, batch_targets in train_loader:
                    optimizer.zero_grad()
                    outputs = model(batch_inputs)
                    loss = criterion(outputs, batch_targets)
                    loss.backward()
                    optimizer.step()
                    total_loss += loss.item()

                if epoch % 10 == 0:
                    print(f"Epoch {epoch+1}/{epochs}, Loss: {total_loss/len(train_loader)}")
                    model.eval()
                    pred, true = model(X_test.flatten(1)).flatten().detach().cpu().numpy(), y_test.flatten().detach().cpu().numpy()
                    print(pearsonr(pred, true)[0]**2)
                    if pearsonr(pred, true)[0]**2 == "nan":
                        break
                    r2_test.append(pearsonr(pred, true)[0]**2)
                    
    except: print("training failed")
            
    return np.array(r2_test).max()

In [161]:
# Create and run the Optuna study
study = optuna.create_study(direction='maximize')
study.optimize(objective, n_trials=100)

# Print the best hyperparameters
best_trial = study.best_trial
print("Best Trial:")
print(f"  Value: {best_trial.value:.4f}")
print("  Params: ")
for key, value in best_trial.params.items():
    print(f"    {key}: {value}")

# You can then use the best hyperparameters to train your final model.


[I 2024-01-21 00:18:19,801] A new study created in memory with name: no-name-5210cbaf-f9c6-43a5-b741-7ff722bab4d9


Epoch 1/200, Loss: 0.7255596537142992
0.5840938040514972
Epoch 11/200, Loss: 0.2647275999188423
0.6380150141554315
Epoch 21/200, Loss: 0.151542445179075
0.6472748756562398
Epoch 31/200, Loss: 0.132892552530393
0.6524717229412433
Epoch 41/200, Loss: 0.12694646744057536
0.6526360246074108
Epoch 51/200, Loss: 0.12181926844641566
0.656070005286557
Epoch 61/200, Loss: 0.11647798912599683
0.6542225979070825
Epoch 71/200, Loss: 0.11137970862910151
0.657197126711261
Epoch 81/200, Loss: 0.10636953520588577
0.6542905883461627
Epoch 91/200, Loss: 0.10244861943647265
0.6554086400343904
Epoch 101/200, Loss: 0.09870132501237094
0.6565829519901396
Epoch 111/200, Loss: 0.09573330520652235
0.6586292765231113
Epoch 121/200, Loss: 0.09366344125010073
0.6567653005641216
Epoch 131/200, Loss: 0.09205860923975706
0.6609650725415648
Epoch 141/200, Loss: 0.09098838968202472
0.6592849741725845
Epoch 151/200, Loss: 0.09055739338509738
0.6600430291847288
Epoch 161/200, Loss: 0.08982385112904012
0.6597757656992393

[I 2024-01-21 00:19:04,435] Trial 0 finished with value: 0.6624350913052945 and parameters: {'hidden_dim_h': 23, 'dropout': 0.08659115453083338, 'batch_size': 626}. Best is trial 0 with value: 0.6624350913052945.


Epoch 1/200, Loss: 0.8850822210311889
0.5833943696758652
Epoch 11/200, Loss: 0.22448545230759515
0.6339279728931273
Epoch 21/200, Loss: 0.11689566572507222
0.6454298365150488
Epoch 31/200, Loss: 0.10832512792613772
0.6523077218891639
Epoch 41/200, Loss: 0.10468807336356904
0.6496975735010428
Epoch 51/200, Loss: 0.10196336458126704
0.6545679831734033
Epoch 61/200, Loss: 0.09913829101456537
0.6601098108808862
Epoch 71/200, Loss: 0.09668091734250386
0.6589921085620146
Epoch 81/200, Loss: 0.09471323937177659
0.657008271759396
Epoch 91/200, Loss: 0.09374889615509245
0.6555203118084191
Epoch 101/200, Loss: 0.09242145005199644
0.6606800014533838
Epoch 111/200, Loss: 0.09172025670607885
0.655344924304318
Epoch 121/200, Loss: 0.09128994511233436
0.6588230908145432
Epoch 131/200, Loss: 0.0915049884054396
0.6605370685057649
Epoch 141/200, Loss: 0.09166089296340943
0.6619584416274162
Epoch 151/200, Loss: 0.09110488974385791
0.6529256073210931
Epoch 161/200, Loss: 0.09131028685304854
0.660315973844

[I 2024-01-21 00:19:53,729] Trial 1 finished with value: 0.6619584416274162 and parameters: {'hidden_dim_h': 29, 'dropout': 0.18998205734048196, 'batch_size': 446}. Best is trial 0 with value: 0.6624350913052945.


Epoch 1/200, Loss: 0.6230156728715608
0.5817712910962907
Epoch 11/200, Loss: 0.28069155595519324
0.6502864963353888
Epoch 21/200, Loss: 0.22045197947458786
0.6515087524314743
Epoch 31/200, Loss: 0.19913906716939175
0.6523289143915387
Epoch 41/200, Loss: 0.17902253929412726
0.6520901207366989
Epoch 51/200, Loss: 0.15951100849744046
0.6555203639028069
Epoch 61/200, Loss: 0.1422123136845502
0.6534536702750282
Epoch 71/200, Loss: 0.1275669573382898
0.6579202587235833
Epoch 81/200, Loss: 0.11531038582324982
0.6524536173354912
Epoch 91/200, Loss: 0.10640095196890109
0.655915919322928
Epoch 101/200, Loss: 0.10019744819763934
0.6589957371343844
Epoch 111/200, Loss: 0.09600481210332928
0.6572775366920461
Epoch 121/200, Loss: 0.09310645158543732
0.6571701442654163
Epoch 131/200, Loss: 0.09180208024653522
0.6558763238012031
Epoch 141/200, Loss: 0.09115409873651736
0.6590903772397851
Epoch 151/200, Loss: 0.09067576875289281
0.6629984673366028
Epoch 161/200, Loss: 0.09078664287473216
0.656457301785

[I 2024-01-21 00:20:40,939] Trial 2 finished with value: 0.6629984673366028 and parameters: {'hidden_dim_h': 31, 'dropout': 0.1405655291690381, 'batch_size': 607}. Best is trial 2 with value: 0.6629984673366028.


Epoch 1/200, Loss: 2.781076519112838
0.550253122134725
Epoch 11/200, Loss: 2.0054106524116113
0.5884080533172684
Epoch 21/200, Loss: 1.4247204880965383
0.10519026545326852
Epoch 31/200, Loss: 0.9372856052298295
0.5872162929282804
Epoch 41/200, Loss: 0.6137696284996835
0.6108357253892711
Epoch 51/200, Loss: 0.4086174588454397
0.6227990247649206
Epoch 61/200, Loss: 0.28319101898293747
0.631896987788262
Epoch 71/200, Loss: 0.21017718550406003
0.6406484854187195
Epoch 81/200, Loss: 0.17220398940538106
0.6464780071652214
Epoch 91/200, Loss: 0.1526928457774614
0.6481996879049009
Epoch 101/200, Loss: 0.14311558478756956
0.6524122054442002
Epoch 111/200, Loss: 0.13883278244420102
0.6526862250098814
Epoch 121/200, Loss: 0.13516671092886673
0.6550365192036598
Epoch 131/200, Loss: 0.1325324620855482
0.6560440830428284
Epoch 141/200, Loss: 0.1304596980151377
0.6549952073517314
Epoch 151/200, Loss: 0.12788440992957667
0.6590049996993378
Epoch 161/200, Loss: 0.125247034979494
0.6564941495567108
Epoc

[I 2024-01-21 00:21:22,589] Trial 3 finished with value: 0.6590049996993378 and parameters: {'hidden_dim_h': 17, 'dropout': 0.22078036188865147, 'batch_size': 1094}. Best is trial 2 with value: 0.6629984673366028.


Epoch 1/200, Loss: 1.6716084503660016
0.564069103215463
Epoch 11/200, Loss: 0.4682083983047336
0.6169320347592729
Epoch 21/200, Loss: 0.1545110225093131
0.635875853227481
Epoch 31/200, Loss: 0.10873989381042182
0.6472598044765869
Epoch 41/200, Loss: 0.1036346231897672
0.6458476238635046
Epoch 51/200, Loss: 0.10216662302321079
0.6572569656456203
Epoch 61/200, Loss: 0.10005740660662744
0.6565217798532053
Epoch 71/200, Loss: 0.09746407702857372
0.6552903956776482
Epoch 81/200, Loss: 0.09601451281239004
0.6557322474016618
Epoch 91/200, Loss: 0.09432235871459924
0.6549064246645897
Epoch 101/200, Loss: 0.0930548963301322
0.6553119555716413
Epoch 111/200, Loss: 0.09244038237660539
0.6584353404260793
Epoch 121/200, Loss: 0.0920440989966486
0.6598946833954067
Epoch 131/200, Loss: 0.09233490859760958
0.6586910239544438
Epoch 141/200, Loss: 0.09151787603018331
0.6602775517868393
Epoch 151/200, Loss: 0.09141878053253773
0.6634719126564141
Epoch 161/200, Loss: 0.09153324570141587
0.6593552245612355

[I 2024-01-21 00:22:16,624] Trial 4 finished with value: 0.6634719126564141 and parameters: {'hidden_dim_h': 36, 'dropout': 0.17830178013188575, 'batch_size': 396}. Best is trial 4 with value: 0.6634719126564141.


Epoch 1/200, Loss: 0.5002144778316672
0.563279023038594
Epoch 11/200, Loss: 0.2647315785288811
0.6249560215809913
Epoch 21/200, Loss: 0.20828312838619406
0.6414137265713917
Epoch 31/200, Loss: 0.19141936166719956
0.6478196951314439
Epoch 41/200, Loss: 0.1780349612236023
0.6461503644304605
Epoch 51/200, Loss: 0.16580687260085886
0.6495980246197375
Epoch 61/200, Loss: 0.15367198329080234
0.650182337055921
Epoch 71/200, Loss: 0.1425580450079658
0.6496124823767172
Epoch 81/200, Loss: 0.13261195035143333
0.6518446766730587
Epoch 91/200, Loss: 0.12350460311228578
0.6537407795923769
Epoch 101/200, Loss: 0.11626939881931651
0.65844284381609
Epoch 111/200, Loss: 0.11053630337119102
0.6486287370726602
Epoch 121/200, Loss: 0.10536942055279558
0.6543416592975108
Epoch 131/200, Loss: 0.10162596743215215
0.6557161332049173
Epoch 141/200, Loss: 0.09854126213626428
0.6573258661640482
Epoch 151/200, Loss: 0.09671571749177846
0.6602582678998233
Epoch 161/200, Loss: 0.09543196247382597
0.6559645242470471

[I 2024-01-21 00:22:58,703] Trial 5 finished with value: 0.6626781450604118 and parameters: {'hidden_dim_h': 13, 'dropout': 0.30473788097494486, 'batch_size': 937}. Best is trial 4 with value: 0.6634719126564141.


Epoch 1/200, Loss: 3.079625461782728
0.48713720604335936
Epoch 11/200, Loss: 1.929486674921853
0.5863793045102349
Epoch 21/200, Loss: 1.181415970836367
0.22543030541295644
Epoch 31/200, Loss: 0.6417440623044968
0.6065803383246456
Epoch 41/200, Loss: 0.3590811075908797
0.627142837261607
Epoch 51/200, Loss: 0.22720472940376826
0.6365199080820878
Epoch 61/200, Loss: 0.17106859545622552
0.6475297883283041
Epoch 71/200, Loss: 0.1499005960566657
0.651673106053623
Epoch 81/200, Loss: 0.14189666935375758
0.653300758058506
Epoch 91/200, Loss: 0.1376246895108904
0.6541653900397495
Epoch 101/200, Loss: 0.13353336762104714
0.653022220348496
Epoch 111/200, Loss: 0.12961467142615998
0.6537229532452629
Epoch 121/200, Loss: 0.1261365810143096
0.6521757870908603
Epoch 131/200, Loss: 0.12156146205961704
0.6558081718847497
Epoch 141/200, Loss: 0.11757115035184793
0.6570980613102406
Epoch 151/200, Loss: 0.1138903833925724
0.6600066280850359
Epoch 161/200, Loss: 0.10962621495127678
0.6575100300009277
Epoch

[I 2024-01-21 00:23:42,977] Trial 6 finished with value: 0.6605334744969457 and parameters: {'hidden_dim_h': 23, 'dropout': 0.1321489501052531, 'batch_size': 729}. Best is trial 4 with value: 0.6634719126564141.


Epoch 1/200, Loss: 0.4989910219845019
0.5811347227494179
Epoch 11/200, Loss: 0.2823046806611513
0.6301726859659219
Epoch 21/200, Loss: 0.21646847301407865
0.6426526215725954
Epoch 31/200, Loss: 0.19615917848913292
0.6504943474785193
Epoch 41/200, Loss: 0.18448960702670247
0.6510837157428281
Epoch 51/200, Loss: 0.17332265486842707
0.6517401526484613
Epoch 61/200, Loss: 0.1625909083767941
0.654299247829097
Epoch 71/200, Loss: 0.1520146939315294
0.6523282470962416
Epoch 81/200, Loss: 0.14206969738006592
0.6536027220692175
Epoch 91/200, Loss: 0.13283334554810272
0.6551750505105348
Epoch 101/200, Loss: 0.12494667737107527
0.6500908920156324
Epoch 111/200, Loss: 0.1177826433589584
0.6586030384546359
Epoch 121/200, Loss: 0.11165706029063777
0.6549608517421157
Epoch 131/200, Loss: 0.10634865337296535
0.6598673766239683
Epoch 141/200, Loss: 0.10254908941294018
0.6586245449164976
Epoch 151/200, Loss: 0.09899548284317318
0.6550337432616681
Epoch 161/200, Loss: 0.09655897985947759
0.65492535846484

[I 2024-01-21 00:24:27,486] Trial 7 finished with value: 0.661684472303644 and parameters: {'hidden_dim_h': 27, 'dropout': 0.16920716126178764, 'batch_size': 1061}. Best is trial 4 with value: 0.6634719126564141.


Epoch 1/200, Loss: 0.21388543605804444
0.5923491394934242
Epoch 11/200, Loss: 0.11441643923521042
0.6503172103490669
Epoch 21/200, Loss: 0.09588354867696762
0.6550746203355159
Epoch 31/200, Loss: 0.0931549152135849
0.6593997634223465
Epoch 41/200, Loss: 0.09318159556388855
0.6602962744457979
Epoch 51/200, Loss: 0.09254331794381142
0.6576211808309104
Epoch 61/200, Loss: 0.09247446006536483
0.6599026938043454
Epoch 71/200, Loss: 0.09206921428442001
0.66142967409939
Epoch 81/200, Loss: 0.0929565577507019
0.6587766725468461
Epoch 91/200, Loss: 0.09161735343933106
0.6559363697664219
Epoch 101/200, Loss: 0.09208788746595382
0.6616126337680894
Epoch 111/200, Loss: 0.09139051064848899
0.6562298018425349
Epoch 121/200, Loss: 0.09201601481437684
0.6631799961473059
Epoch 131/200, Loss: 0.0916092883348465
0.6574800241175779
Epoch 141/200, Loss: 0.09179394435882568
0.6601215387022873
Epoch 151/200, Loss: 0.09126515966653824
0.6590690338292382
Epoch 161/200, Loss: 0.09176725077629089
0.6582015995357

[I 2024-01-21 00:25:45,421] Trial 8 finished with value: 0.6631799961473059 and parameters: {'hidden_dim_h': 14, 'dropout': 0.12335055399679382, 'batch_size': 160}. Best is trial 4 with value: 0.6634719126564141.


Epoch 1/200, Loss: 0.28157921723879065
0.5926219939600015
Epoch 11/200, Loss: 0.1245134442000632
0.6338377909041842
Epoch 21/200, Loss: 0.09832087467620328
0.6483812600277364
Epoch 31/200, Loss: 0.09475367008500797
0.6507314339210469
Epoch 41/200, Loss: 0.09462930523096376
0.6561950161294522
Epoch 51/200, Loss: 0.09432548899084899
0.6591924582361487
Epoch 61/200, Loss: 0.09367859997092538
0.6552119355460867
Epoch 71/200, Loss: 0.09334605429202887
0.6511810514492301
Epoch 81/200, Loss: 0.09305551116633567
0.6582623012811422
Epoch 91/200, Loss: 0.09260920653487467
0.6548034195220891
Epoch 101/200, Loss: 0.09285678349103138
0.6565583046965121
Epoch 111/200, Loss: 0.09245080633717738
0.6554360475625899
Epoch 121/200, Loss: 0.09220724348809309
0.6568738214487594
Epoch 131/200, Loss: 0.09242624091874262
0.6576212074941981
Epoch 141/200, Loss: 0.09203877394935887
0.6569192093763806
Epoch 151/200, Loss: 0.09222667502939322
0.6595560958590512
Epoch 161/200, Loss: 0.09245647855435207
0.659353273

[I 2024-01-21 00:27:19,284] Trial 9 finished with value: 0.6605512502118763 and parameters: {'hidden_dim_h': 48, 'dropout': 0.10516522005653312, 'batch_size': 128}. Best is trial 4 with value: 0.6634719126564141.


Epoch 1/200, Loss: 0.24384083405688958
0.5827566379321423
Epoch 11/200, Loss: 0.1630744602945116
0.6433611797770866
Epoch 21/200, Loss: 0.12551794766827865
0.6470354541048601
Epoch 31/200, Loss: 0.10515784085900695
0.6517323618346804
Epoch 41/200, Loss: 0.09879583341104013
0.6501567120413704
Epoch 51/200, Loss: 0.0956539155708419
0.6584716980696403
Epoch 61/200, Loss: 0.09387340893348058
0.6550491441264986
Epoch 71/200, Loss: 0.09413661849167612
0.6538854357055935
Epoch 81/200, Loss: 0.09433384143092015
0.6524677166753704
Epoch 91/200, Loss: 0.09303996229061375
0.6533007787479423
Epoch 101/200, Loss: 0.09342074132076016
0.6536587805308978
Epoch 111/200, Loss: 0.09371175203058454
0.6582469529925086
Epoch 121/200, Loss: 0.09282382011965469
0.6603976353747675
Epoch 131/200, Loss: 0.0918676156412672
0.6559329230996575
Epoch 141/200, Loss: 0.09269607011918668
0.6604704353046792
Epoch 151/200, Loss: 0.09402645531075972
0.6577786737566897
Epoch 161/200, Loss: 0.09353121025142846
0.65820991685

[I 2024-01-21 00:28:15,230] Trial 10 finished with value: 0.6604704353046792 and parameters: {'hidden_dim_h': 40, 'dropout': 0.25880379825281663, 'batch_size': 377}. Best is trial 4 with value: 0.6634719126564141.


Epoch 1/200, Loss: 0.3768403824143762
0.5993793155944568
Epoch 11/200, Loss: 0.14180602958338373
0.6461778659534203
Epoch 21/200, Loss: 0.10201115921239724
0.6505864361613397
Epoch 31/200, Loss: 0.09436640030885703
0.6573512207041377
Epoch 41/200, Loss: 0.09399677858056638
0.6591552911556349
Epoch 51/200, Loss: 0.09321610322034599
0.6543141108445025
Epoch 61/200, Loss: 0.09256866466779037
0.6562158034707475
Epoch 71/200, Loss: 0.09271093967976986
0.6599626671523864
Epoch 81/200, Loss: 0.09183009113841409
0.6588296319277025
Epoch 91/200, Loss: 0.09247194255558436
0.660116197770166
Epoch 101/200, Loss: 0.09277387058374865
0.6620649534322512
Epoch 111/200, Loss: 0.09213357953817253
0.6629020468294867
Epoch 121/200, Loss: 0.09209256306690658
0.658566837454735
Epoch 131/200, Loss: 0.09207015492072042
0.6594450421003949
Epoch 141/200, Loss: 0.09164499516455119
0.6606530557625664
Epoch 151/200, Loss: 0.09089747036263447
0.6614723630950707
Epoch 161/200, Loss: 0.09184317088267147
0.65709701753

[I 2024-01-21 00:29:44,856] Trial 11 finished with value: 0.664822187307751 and parameters: {'hidden_dim_h': 38, 'dropout': 0.06038334966705082, 'batch_size': 135}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.23243144620209932
0.5917419276587746
Epoch 11/200, Loss: 0.15891738422214985
0.6388209613276761
Epoch 21/200, Loss: 0.1212436908390373
0.6408495740222614
Epoch 31/200, Loss: 0.10230941302143037
0.650499338074193
Epoch 41/200, Loss: 0.09469797869678587
0.6527772556013081
Epoch 51/200, Loss: 0.0920515509787947
0.6595146965443254
Epoch 61/200, Loss: 0.09114387666340917
0.6540745652916355
Epoch 71/200, Loss: 0.09101166040636599
0.6599536061309684
Epoch 81/200, Loss: 0.09065813093911856
0.6602091100594532
Epoch 91/200, Loss: 0.09053715958725661
0.6591546601835995
Epoch 101/200, Loss: 0.0906747707631439
0.6583168208075845
Epoch 111/200, Loss: 0.09024708333890885
0.6595373583712896
Epoch 121/200, Loss: 0.09046476217918098
0.661269018643601
Epoch 131/200, Loss: 0.09065518388524652
0.6585881846486362
Epoch 141/200, Loss: 0.09030228736810386
0.662163382989638
Epoch 151/200, Loss: 0.09045037964824587
0.6579829595567563
Epoch 161/200, Loss: 0.09042940195649862
0.66223850873973

[I 2024-01-21 00:30:44,289] Trial 12 finished with value: 0.6628035426617174 and parameters: {'hidden_dim_h': 38, 'dropout': 0.05654784178392291, 'batch_size': 314}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 2.6196501064300537
0.5365205760915771
Epoch 11/200, Loss: 0.6920791975657146
0.6223119107850784
Epoch 21/200, Loss: 0.2428463105360667
0.593730704172544
Epoch 31/200, Loss: 0.18524198551972706
0.6337627430070215
Epoch 41/200, Loss: 0.1654378738005956
0.643438494406676
Epoch 51/200, Loss: 0.14449865102767945
0.6490942152108677
Epoch 61/200, Loss: 0.12448491136233011
0.6477491592825861
Epoch 71/200, Loss: 0.10948536396026612
0.6455023807085437
Epoch 81/200, Loss: 0.10023737251758576
0.6528899727330717
Epoch 91/200, Loss: 0.09570006350676219
0.6520397210820725
Epoch 101/200, Loss: 0.09406195729970931
0.6548186477196472
Epoch 111/200, Loss: 0.0936974373459816
0.6561589026651486
Epoch 121/200, Loss: 0.09314028084278107
0.6561241966926883
Epoch 131/200, Loss: 0.0938010095556577
0.6589779015176014
Epoch 141/200, Loss: 0.09353862474362055
0.657535567778935
Epoch 151/200, Loss: 0.09428790499766668
0.6593276327746558
Epoch 161/200, Loss: 0.0934912579258283
0.6570093874467684
E

[I 2024-01-21 00:31:47,568] Trial 13 finished with value: 0.6603626272799316 and parameters: {'hidden_dim_h': 38, 'dropout': 0.2405343699614549, 'batch_size': 269}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.2272477565809738
0.582360254598955
Epoch 11/200, Loss: 0.49442629966624946
0.04093959072211819
Epoch 21/200, Loss: 0.226651429090389
0.6071102572027524
Epoch 31/200, Loss: 0.18619960303916488
0.6418774192071823
Epoch 41/200, Loss: 0.17177545227283655
0.6363604903517732
Epoch 51/200, Loss: 0.1582155432118926
0.6432027335531595
Epoch 61/200, Loss: 0.1450386643409729
0.6484695852815962
Epoch 71/200, Loss: 0.132068503561408
0.6511849113400541
Epoch 81/200, Loss: 0.12098800910766734
0.6438302912916448
Epoch 91/200, Loss: 0.11197807414587153
0.6511699730584526
Epoch 101/200, Loss: 0.1049599181427512
0.6541721734900922
Epoch 111/200, Loss: 0.09956844861424247
0.6518358481943858
Epoch 121/200, Loss: 0.09836813253025677
0.6520101781360997
Epoch 131/200, Loss: 0.09608911168436672
0.6572613585828898
Epoch 141/200, Loss: 0.09528789149467336
0.6587578109338184
Epoch 151/200, Loss: 0.09490375896525938
0.6541387299930846
Epoch 161/200, Loss: 0.09497488567302394
0.6578793429602398

[I 2024-01-21 00:32:43,129] Trial 14 finished with value: 0.6587578109338184 and parameters: {'hidden_dim_h': 46, 'dropout': 0.3478476458700087, 'batch_size': 473}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.8202991963742854
0.5883636293603884
Epoch 11/200, Loss: 0.16216916124244313
0.6402682464502711
Epoch 21/200, Loss: 0.13898251197495304
0.653444682865098
Epoch 31/200, Loss: 0.11805027821561792
0.6437296675662063
Epoch 41/200, Loss: 0.10283833594767602
0.6575699025844433
Epoch 51/200, Loss: 0.09472402545449497
0.6580576357106521
Epoch 61/200, Loss: 0.09227778508767977
0.6571096166292717
Epoch 71/200, Loss: 0.09128802056823458
0.6594763875886852
Epoch 81/200, Loss: 0.09116407713064781
0.6552475253974829
Epoch 91/200, Loss: 0.09170082760053677
0.6562432719121204
Epoch 101/200, Loss: 0.09165641755520643
0.6601654627415504
Epoch 111/200, Loss: 0.09163800954491227
0.657714663423131
Epoch 121/200, Loss: 0.09049772348377731
0.6586739750748833
Epoch 131/200, Loss: 0.09122878525938306
0.6601963976193213
Epoch 141/200, Loss: 0.0904101584475119
0.6596968957044083
Epoch 151/200, Loss: 0.09076623282917254
0.6561385494878242
Epoch 161/200, Loss: 0.09167550012960539
0.661305402918

[I 2024-01-21 00:33:48,810] Trial 15 finished with value: 0.6630113097437628 and parameters: {'hidden_dim_h': 34, 'dropout': 0.05173166675415641, 'batch_size': 222}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.18320346002134016
0.6077190821277102
Epoch 11/200, Loss: 0.10309035203617471
0.6464179805636167
Epoch 21/200, Loss: 0.09702960973113312
0.6398754361165595
Epoch 31/200, Loss: 0.09632712660521424
0.6423713259269276
Epoch 41/200, Loss: 0.09589447797194046
0.6564499275071841
Epoch 51/200, Loss: 0.09493975078812535
0.65127756028709
Epoch 61/200, Loss: 0.09508854716321347
0.6520690188707715
Epoch 71/200, Loss: 0.09469257810495678
0.6516798911567799
Epoch 81/200, Loss: 0.09415177095662126
0.6533272925742893
Epoch 91/200, Loss: 0.09402678320136094
0.6563177748850633
Epoch 101/200, Loss: 0.09385673273258259
0.655654144306699
Epoch 111/200, Loss: 0.09373128024253202
0.657506910564162
Epoch 121/200, Loss: 0.09381293049902496
0.6583468602395852
Epoch 131/200, Loss: 0.09294850552946793
0.6577902473568993
Epoch 141/200, Loss: 0.09361171170374272
0.6581322413783349
Epoch 151/200, Loss: 0.09388172508753026
0.6574689794444794
Epoch 161/200, Loss: 0.09319624453396995
0.659520619975

[I 2024-01-21 00:35:39,371] Trial 16 finished with value: 0.6598725819933416 and parameters: {'hidden_dim_h': 45, 'dropout': 0.16395201737883294, 'batch_size': 104}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.3220014583605986
0.58617172460422
Epoch 11/200, Loss: 0.24425532153019539
0.6381522337019747
Epoch 21/200, Loss: 0.2055075804774578
0.644155741525554
Epoch 31/200, Loss: 0.172791709120457
0.6441715659656129
Epoch 41/200, Loss: 0.14792530238628387
0.6527364748795927
Epoch 51/200, Loss: 0.12916541013580102
0.6474537306849385
Epoch 61/200, Loss: 0.11547023401810573
0.6539094803758843
Epoch 71/200, Loss: 0.106310584797309
0.6538987164668403
Epoch 81/200, Loss: 0.10055064152066524
0.654131741772925
Epoch 91/200, Loss: 0.0969212668446394
0.6599712046899024
Epoch 101/200, Loss: 0.09513055733763255
0.6567605117948762
Epoch 111/200, Loss: 0.09394999220967293
0.6600325799650822
Epoch 121/200, Loss: 0.09279061567324859
0.6595631125915749
Epoch 131/200, Loss: 0.09290079199350797
0.6610989526398157
Epoch 141/200, Loss: 0.092180263537627
0.6591342127189261
Epoch 151/200, Loss: 0.09211531568032044
0.6600158621764646
Epoch 161/200, Loss: 0.09251142293214798
0.6628515708348717
Epoc

[I 2024-01-21 00:36:30,856] Trial 17 finished with value: 0.6628515708348717 and parameters: {'hidden_dim_h': 42, 'dropout': 0.2863419188965738, 'batch_size': 781}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.394170869337885
0.5825370867566961
Epoch 11/200, Loss: 0.152746718180807
0.6439920087448753
Epoch 21/200, Loss: 0.13532457677157303
0.6401864269818308
Epoch 31/200, Loss: 0.12612126591174225
0.651305620710162
Epoch 41/200, Loss: 0.11682197784906939
0.656870886040843
Epoch 51/200, Loss: 0.1091409184430775
0.6571092528455948
Epoch 61/200, Loss: 0.10302406863162392
0.6544029048581573
Epoch 71/200, Loss: 0.09928855535231139
0.6549411438479134
Epoch 81/200, Loss: 0.09566892977607877
0.6558723573221981
Epoch 91/200, Loss: 0.09373550293476958
0.6593883039611752
Epoch 101/200, Loss: 0.09271526944480445
0.6591219973925342
Epoch 111/200, Loss: 0.09245592767470762
0.6577070021178568
Epoch 121/200, Loss: 0.0913147222446768
0.6603558155392352
Epoch 131/200, Loss: 0.09145161725188557
0.6541123633893714
Epoch 141/200, Loss: 0.09130045203001876
0.6623152996689669
Epoch 151/200, Loss: 0.09158644687972571
0.6593654818288315
Epoch 161/200, Loss: 0.09091422589201677
0.6569190987239637

[I 2024-01-21 00:37:21,324] Trial 18 finished with value: 0.6623152996689669 and parameters: {'hidden_dim_h': 34, 'dropout': 0.19652985905883266, 'batch_size': 534}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.108287770097906
0.5929523346842555
Epoch 11/200, Loss: 0.34879092953421853
0.6367305636445539
Epoch 21/200, Loss: 0.24733546674251555
0.642039336966883
Epoch 31/200, Loss: 0.21523195180025967
0.6453518485010366
Epoch 41/200, Loss: 0.1843240575356917
0.63918163730173
Epoch 51/200, Loss: 0.15485724251378666
0.6503727762883046
Epoch 61/200, Loss: 0.13223388289863414
0.6538975948304009
Epoch 71/200, Loss: 0.11416450291872024
0.6556110931243592
Epoch 81/200, Loss: 0.10313252359628677
0.6540632391980501
Epoch 91/200, Loss: 0.09707390300252221
0.6546017234106645
Epoch 101/200, Loss: 0.0936040455644781
0.655632147493258
Epoch 111/200, Loss: 0.09215707088058644
0.6581253861398653
Epoch 121/200, Loss: 0.09154897250912407
0.6603290793405596
Epoch 131/200, Loss: 0.09237621968442744
0.6556447669468749
Epoch 141/200, Loss: 0.09313164353370666
0.6610437925147826
Epoch 151/200, Loss: 0.09091995670036836
0.6584374288913567
Epoch 161/200, Loss: 0.09012948464263569
0.6620262012222602

[I 2024-01-21 00:38:16,816] Trial 19 finished with value: 0.6620262012222602 and parameters: {'hidden_dim_h': 35, 'dropout': 0.0856939833901119, 'batch_size': 370}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.24084151868360587
0.6016490033840901
Epoch 11/200, Loss: 0.13640833897403923
0.6430868153585019
Epoch 21/200, Loss: 0.10394811432763755
0.6470385693902361
Epoch 31/200, Loss: 0.0952876960656729
0.6470535050584841
Epoch 41/200, Loss: 0.0936366881591728
0.6566477534533501
Epoch 51/200, Loss: 0.09344819978059056
0.6556399541556692
Epoch 61/200, Loss: 0.0930778291749667
0.657072527974919
Epoch 71/200, Loss: 0.09238524932459176
0.6579351627414011
Epoch 81/200, Loss: 0.09278987967465298
0.6557779689404675
Epoch 91/200, Loss: 0.09243663193949733
0.6559449898482212
Epoch 101/200, Loss: 0.0926357001425272
0.6587849610918926
Epoch 111/200, Loss: 0.09204686801117587
0.6597894199308009
Epoch 121/200, Loss: 0.092107103082789
0.6583318341102539
Epoch 131/200, Loss: 0.09220120059438498
0.6588551037879049
Epoch 141/200, Loss: 0.09185224654803793
0.660285048865463
Epoch 151/200, Loss: 0.09137894823608628
0.6608610839312725
Epoch 161/200, Loss: 0.0916549930550966
0.6581649268063998


[I 2024-01-21 00:39:25,010] Trial 20 finished with value: 0.6608610839312725 and parameters: {'hidden_dim_h': 43, 'dropout': 0.16126833247599026, 'batch_size': 243}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 2.8304297670853877
0.5702093391502813
Epoch 11/200, Loss: 0.44475454724995434
0.6204440981743464
Epoch 21/200, Loss: 0.2069893315830062
0.6225836136099585
Epoch 31/200, Loss: 0.1701188422409834
0.6424082387954327
Epoch 41/200, Loss: 0.13366891278893547
0.6483181470231597
Epoch 51/200, Loss: 0.10760591284627408
0.6517589274165914
Epoch 61/200, Loss: 0.09640999276817372
0.6556842274666117
Epoch 71/200, Loss: 0.09272361048950559
0.6576873275238728
Epoch 81/200, Loss: 0.09240597334846987
0.6595418134190627
Epoch 91/200, Loss: 0.09262238970372529
0.6576970075453399
Epoch 101/200, Loss: 0.0920072535827624
0.6607099788038051
Epoch 111/200, Loss: 0.0920422648170353
0.662901277128802
Epoch 121/200, Loss: 0.09202332089168835
0.6617968506955033
Epoch 131/200, Loss: 0.09156797865850735
0.6630540856481959
Epoch 141/200, Loss: 0.09186445677702405
0.6637104640372161
Epoch 151/200, Loss: 0.09102169305613611
0.6634755422994548
Epoch 161/200, Loss: 0.09175712219645492
0.66092041634393

[I 2024-01-21 00:40:37,510] Trial 21 finished with value: 0.6637104640372161 and parameters: {'hidden_dim_h': 13, 'dropout': 0.11127979214161411, 'batch_size': 178}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.8159631599600499
0.5826262430950602
Epoch 11/200, Loss: 0.23055790379070318
0.6315472097750741
Epoch 21/200, Loss: 0.17225607126378095
0.6354209687022633
Epoch 31/200, Loss: 0.12560994106416518
0.6421959688596196
Epoch 41/200, Loss: 0.10195575131533238
0.6424350128339059
Epoch 51/200, Loss: 0.0957137392117427
0.6452171525050605
Epoch 61/200, Loss: 0.09318997718107241
0.6568700354083234
Epoch 71/200, Loss: 0.09326184526658975
0.6543762891897698
Epoch 81/200, Loss: 0.0922085579771262
0.6584206119679319
Epoch 91/200, Loss: 0.09272538777440786
0.6600989891659765
Epoch 101/200, Loss: 0.09184285453878917
0.6551662333676183
Epoch 111/200, Loss: 0.09208582040782158
0.6539647658567053
Epoch 121/200, Loss: 0.0916761914268136
0.6618302720214035
Epoch 131/200, Loss: 0.09180813597945067
0.6620100698338475
Epoch 141/200, Loss: 0.09240915920012273
0.6627543608896777
Epoch 151/200, Loss: 0.09169052999753219
0.6606712123593488
Epoch 161/200, Loss: 0.09130407869815826
0.661750763942

[I 2024-01-21 00:41:53,166] Trial 22 finished with value: 0.6641071882767094 and parameters: {'hidden_dim_h': 50, 'dropout': 0.10629154775895877, 'batch_size': 194}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.33559021663547745
0.588585365508307
Epoch 11/200, Loss: 0.14224366858454035
0.6380440368411718
Epoch 21/200, Loss: 0.10842173487538158
0.6526128994811088
Epoch 31/200, Loss: 0.09557208972107066
0.6531375450729909
Epoch 41/200, Loss: 0.09292850318816628
0.6571082564993146
Epoch 51/200, Loss: 0.09197594609000895
0.6570273015063466
Epoch 61/200, Loss: 0.09186012976535476
0.6583708490704652
Epoch 71/200, Loss: 0.09164626793106004
0.6556563463954603
Epoch 81/200, Loss: 0.09202639315978135
0.6592131825340909
Epoch 91/200, Loss: 0.09141584131682273
0.6620484525639306
Epoch 101/200, Loss: 0.09133194829567824
0.6604490108197401
Epoch 111/200, Loss: 0.09161423825391449
0.6643042622025189
Epoch 121/200, Loss: 0.09123703475930903
0.6607325660511123
Epoch 131/200, Loss: 0.09105092183788224
0.6562403219637052
Epoch 141/200, Loss: 0.09168603514680768
0.6598900380884274
Epoch 151/200, Loss: 0.0907295606661551
0.6581148882234596
Epoch 161/200, Loss: 0.09074559040588907
0.6576128447

[I 2024-01-21 00:43:00,203] Trial 23 finished with value: 0.6643042622025189 and parameters: {'hidden_dim_h': 19, 'dropout': 0.08719736196832131, 'batch_size': 199}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.9531237070377057
0.5902210020328287
Epoch 11/200, Loss: 0.27893198957810034
0.6404180493252857
Epoch 21/200, Loss: 0.22213531136512757
0.6417950834429996
Epoch 31/200, Loss: 0.18545893545334155
0.6367485161024894
Epoch 41/200, Loss: 0.15144769503520086
0.6462539043732173
Epoch 51/200, Loss: 0.12441447709615414
0.6425119432222811
Epoch 61/200, Loss: 0.10734854535414623
0.6483322322702536
Epoch 71/200, Loss: 0.09792319650833424
0.6544682999565128
Epoch 81/200, Loss: 0.0938111689228278
0.655629736461746
Epoch 91/200, Loss: 0.09164643127184648
0.6570407981588651
Epoch 101/200, Loss: 0.09117412784924873
0.657665124619455
Epoch 111/200, Loss: 0.0913112956743974
0.6599112405443712
Epoch 121/200, Loss: 0.09087567134545399
0.6578257297800824
Epoch 131/200, Loss: 0.09088976646845158
0.6592684076406102
Epoch 141/200, Loss: 0.09007787211583211
0.6515202502443604
Epoch 151/200, Loss: 0.09104624482301565
0.6614575360260426
Epoch 161/200, Loss: 0.09068129693086331
0.6585221073809

[I 2024-01-21 00:44:05,768] Trial 24 finished with value: 0.6614575360260426 and parameters: {'hidden_dim_h': 50, 'dropout': 0.0785653333466739, 'batch_size': 311}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.25347296237945555
0.5911266237804559
Epoch 11/200, Loss: 0.1328188705444336
0.6476363796734002
Epoch 21/200, Loss: 0.0997486199438572
0.6532854688818757
Epoch 31/200, Loss: 0.09288388922810555
0.6569361504084413
Epoch 41/200, Loss: 0.09204212546348572
0.6579852013836123
Epoch 51/200, Loss: 0.09159846715629101
0.6580959006698339
Epoch 61/200, Loss: 0.09145080961287022
0.6566711972748706
Epoch 71/200, Loss: 0.09082079395651817
0.6588307101000466
Epoch 81/200, Loss: 0.09099569663405419
0.6585972545668808
Epoch 91/200, Loss: 0.0909978474676609
0.6559474401439841
Epoch 101/200, Loss: 0.09078589238226414
0.6593775879308902
Epoch 111/200, Loss: 0.09152593828737736
0.6561630311318601
Epoch 121/200, Loss: 0.09100215300917626
0.6607492538028423
Epoch 131/200, Loss: 0.09027243256568909
0.6636394870186091
Epoch 141/200, Loss: 0.09061221487820148
0.659551591939583
Epoch 151/200, Loss: 0.09077442497015
0.6613367970696238
Epoch 161/200, Loss: 0.09028482090681791
0.656355728874171

[I 2024-01-21 00:45:12,361] Trial 25 finished with value: 0.6636394870186091 and parameters: {'hidden_dim_h': 19, 'dropout': 0.06903354406263186, 'batch_size': 200}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.4904497672641088
0.5709622447377571
Epoch 11/200, Loss: 0.11039950008745547
0.645379482215706
Epoch 21/200, Loss: 0.10068541548397175
0.6514385960233978
Epoch 31/200, Loss: 0.09509692317436612
0.6566827268259426
Epoch 41/200, Loss: 0.09444135301327579
0.6595357810712382
Epoch 51/200, Loss: 0.09333739630759709
0.6569901418310002
Epoch 61/200, Loss: 0.09330109213158568
0.658313377904834
Epoch 71/200, Loss: 0.0932069266481059
0.6607336695898741
Epoch 81/200, Loss: 0.0929300235535102
0.6610724764646451
Epoch 91/200, Loss: 0.09224149304880667
0.6594335328131395
Epoch 101/200, Loss: 0.09311656839160061
0.660185819056771
Epoch 111/200, Loss: 0.09264619096561715
0.6626819176698667
Epoch 121/200, Loss: 0.09277424878544277
0.6612435402817135
Epoch 131/200, Loss: 0.0917499158038664
0.6564338370611054
Epoch 141/200, Loss: 0.09204117835514129
0.6621414063858745
Epoch 151/200, Loss: 0.09175684914071724
0.6596898015266989
Epoch 161/200, Loss: 0.09221577447242837
0.659003694828124

[I 2024-01-21 00:46:58,868] Trial 26 finished with value: 0.662860082853707 and parameters: {'hidden_dim_h': 10, 'dropout': 0.1012239441304196, 'batch_size': 106}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.2137159526348114
0.5867632963688347
Epoch 11/200, Loss: 0.16150593236088753
0.6504910414263899
Epoch 21/200, Loss: 0.13074423968791962
0.6514122609555691
Epoch 31/200, Loss: 0.11162407845258712
0.6572069119104471
Epoch 41/200, Loss: 0.10119140855967998
0.6576041023581775
Epoch 51/200, Loss: 0.09544642511755227
0.6544078864250822
Epoch 61/200, Loss: 0.09297017827630043
0.6567055110387349
Epoch 71/200, Loss: 0.09166774433106184
0.6593992473415805
Epoch 81/200, Loss: 0.0914931071922183
0.6557272281186468
Epoch 91/200, Loss: 0.09072906933724881
0.6601414843836272
Epoch 101/200, Loss: 0.0905954385176301
0.6585211581616291
Epoch 111/200, Loss: 0.09105586130172014
0.6576464911706721
Epoch 121/200, Loss: 0.0911824343726039
0.661059740051926
Epoch 131/200, Loss: 0.09095117952674628
0.6609917047873604
Epoch 141/200, Loss: 0.09048560708761215
0.6575169249213463
Epoch 151/200, Loss: 0.09041484706103801
0.6624261204077985
Epoch 161/200, Loss: 0.09070511274039746
0.6610003181572

[I 2024-01-21 00:47:46,327] Trial 27 finished with value: 0.6624261204077985 and parameters: {'hidden_dim_h': 24, 'dropout': 0.14448239709961708, 'batch_size': 503}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.18537593304234393
0.5883090790088304
Epoch 11/200, Loss: 0.126389909097377
0.6395374994804713
Epoch 21/200, Loss: 0.10318856412435279
0.6435553800866467
Epoch 31/200, Loss: 0.09497773855486337
0.647546632382381
Epoch 41/200, Loss: 0.09240246816154789
0.6519230194328038
Epoch 51/200, Loss: 0.09222647394327556
0.6596890433751423
Epoch 61/200, Loss: 0.0916192309163949
0.655235569349208
Epoch 71/200, Loss: 0.09163970478317317
0.6579020206925321
Epoch 81/200, Loss: 0.09085828723276362
0.6546967569684646
Epoch 91/200, Loss: 0.09129202300134827
0.6570709976885142
Epoch 101/200, Loss: 0.09052376909291043
0.657293929918547
Epoch 111/200, Loss: 0.09066151959054611
0.6583726003206348
Epoch 121/200, Loss: 0.09023791704984273
0.6590210952254139
Epoch 131/200, Loss: 0.09009139469879515
0.659233751346487
Epoch 141/200, Loss: 0.09006470332250875
0.6593389493737376
Epoch 151/200, Loss: 0.0903494739357163
0.6602684466611964
Epoch 161/200, Loss: 0.0902487852555864
0.6591398532635174


[I 2024-01-21 00:48:52,357] Trial 28 finished with value: 0.6645458793041422 and parameters: {'hidden_dim_h': 50, 'dropout': 0.051449876716145114, 'batch_size': 295}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.1656998653303493
0.5999352753099766
Epoch 11/200, Loss: 0.11231541588450923
0.6490224216743234
Epoch 21/200, Loss: 0.09878857467662204
0.6539929186121287
Epoch 31/200, Loss: 0.09305763233340147
0.6550952407397133
Epoch 41/200, Loss: 0.09196043545098016
0.6521476415173193
Epoch 51/200, Loss: 0.09167922649419669
0.6566637801568476
Epoch 61/200, Loss: 0.0924372747540474
0.6553958705284919
Epoch 71/200, Loss: 0.0907663084340818
0.6580014892410342
Epoch 81/200, Loss: 0.09144922853870825
0.6570570202150808
Epoch 91/200, Loss: 0.09070896594361826
0.6588242337702669
Epoch 101/200, Loss: 0.09123099900104782
0.6584055261689785
Epoch 111/200, Loss: 0.09042210425391342
0.656742731679657
Epoch 121/200, Loss: 0.09074970808896152
0.6613970127318767
Epoch 131/200, Loss: 0.09071253900500861
0.6601141528546217
Epoch 141/200, Loss: 0.09037029020714038
0.65978735191621
Epoch 151/200, Loss: 0.0910526140395439
0.6636989677896461
Epoch 161/200, Loss: 0.09053971855477853
0.661402556439559

[I 2024-01-21 00:49:49,568] Trial 29 finished with value: 0.6636989677896461 and parameters: {'hidden_dim_h': 26, 'dropout': 0.08050356154703767, 'batch_size': 307}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.3358852515618007
0.5652930546100025
Epoch 11/200, Loss: 0.7035597786307335
0.6160570185778262
Epoch 21/200, Loss: 0.36788807933529216
0.6309053595683238
Epoch 31/200, Loss: 0.2125122770667076
0.6404797699998523
Epoch 41/200, Loss: 0.14969363311926523
0.6477370664106806
Epoch 51/200, Loss: 0.1286224757010738
0.6507967451404152
Epoch 61/200, Loss: 0.12082096965362628
0.6514629754496243
Epoch 71/200, Loss: 0.1192078199237585
0.651434333658102
Epoch 81/200, Loss: 0.11571204134573539
0.6521145743797616
Epoch 91/200, Loss: 0.1139233832557996
0.656968376752567
Epoch 101/200, Loss: 0.110396065749228
0.6588953623733357
Epoch 111/200, Loss: 0.10814946113775174
0.6551281254524076
Epoch 121/200, Loss: 0.1060979226604104
0.6563348874825616
Epoch 131/200, Loss: 0.10385701339691877
0.6582319991890555
Epoch 141/200, Loss: 0.10124878336985906
0.6586288917064262
Epoch 151/200, Loss: 0.09933270079394181
0.6568047010427788
Epoch 161/200, Loss: 0.09686470994104941
0.6579434574464151
Ep

[I 2024-01-21 00:50:32,420] Trial 30 finished with value: 0.6588953623733357 and parameters: {'hidden_dim_h': 19, 'dropout': 0.052476429742572696, 'batch_size': 860}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.29007680405830516
0.6050818806229795
Epoch 11/200, Loss: 0.14531678903376918
0.6355201694412307
Epoch 21/200, Loss: 0.1153984763498964
0.6497135407803873
Epoch 31/200, Loss: 0.10002606148007272
0.6449034127894779
Epoch 41/200, Loss: 0.09455994062725155
0.6515065592711672
Epoch 51/200, Loss: 0.0929705152908961
0.6536742878462515
Epoch 61/200, Loss: 0.0926110095333779
0.6537537946908102
Epoch 71/200, Loss: 0.09197954944838052
0.6561631268944658
Epoch 81/200, Loss: 0.09154275222413841
0.6550538552165198
Epoch 91/200, Loss: 0.0917591190543668
0.6587811646515113
Epoch 101/200, Loss: 0.09133047670468517
0.6643473608666853
Epoch 111/200, Loss: 0.09157052088057858
0.6572685281906255
Epoch 121/200, Loss: 0.09140176197578168
0.6579409167442727
Epoch 131/200, Loss: 0.09117633935021258
0.6611553906860095
Epoch 141/200, Loss: 0.09105221764452157
0.6552653986070153
Epoch 151/200, Loss: 0.09140999452478585
0.659339805615737
Epoch 161/200, Loss: 0.09121675044298172
0.6585173260466

[I 2024-01-21 00:51:44,884] Trial 31 finished with value: 0.6643473608666853 and parameters: {'hidden_dim_h': 50, 'dropout': 0.09720732237802182, 'batch_size': 231}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.23153561614453794
0.6008300018436304
Epoch 11/200, Loss: 0.13313417807221412
0.6463114989026256
Epoch 21/200, Loss: 0.10233527375385165
0.6527389428271148
Epoch 31/200, Loss: 0.09402233874425292
0.6531352867481056
Epoch 41/200, Loss: 0.09281963920220733
0.6532467073932091
Epoch 51/200, Loss: 0.09255632096901537
0.6500019820279471
Epoch 61/200, Loss: 0.09178531756624579
0.6547006429567014
Epoch 71/200, Loss: 0.09186054486781359
0.6600927647451088
Epoch 81/200, Loss: 0.09197448706254363
0.6524313397539205
Epoch 91/200, Loss: 0.09144329857081175
0.6597576737503597
Epoch 101/200, Loss: 0.09149350300431251
0.6550664368586133
Epoch 111/200, Loss: 0.09176386008039117
0.6570700979377099
Epoch 121/200, Loss: 0.09113864144310355
0.6568208517643777
Epoch 131/200, Loss: 0.0911646862514317
0.6627555581174129
Epoch 141/200, Loss: 0.0903590346686542
0.6556095599737553
Epoch 151/200, Loss: 0.09089858494699002
0.660162042867203
Epoch 161/200, Loss: 0.09139687279239297
0.65961633157

[I 2024-01-21 00:52:53,277] Trial 32 finished with value: 0.6627555581174129 and parameters: {'hidden_dim_h': 46, 'dropout': 0.09177460704880613, 'batch_size': 252}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.4152419088464795
0.5819844945179965
Epoch 11/200, Loss: 0.24718435244126755
0.6485731721047856
Epoch 21/200, Loss: 0.21186299938144107
0.6501879785790479
Epoch 31/200, Loss: 0.18101353491797592
0.6384288462905803
Epoch 41/200, Loss: 0.1535931071548751
0.6478913242028994
Epoch 51/200, Loss: 0.13344339529673258
0.65469327028188
Epoch 61/200, Loss: 0.11706288407246272
0.6567051993645124
Epoch 71/200, Loss: 0.10616116722424825
0.6605219255561298
Epoch 81/200, Loss: 0.09887496743238333
0.6601252007462999
Epoch 91/200, Loss: 0.09489176399780042
0.6595720069796585
Epoch 101/200, Loss: 0.09223983256202756
0.6616664199863339
Epoch 111/200, Loss: 0.09071418462377606
0.656350357816717
Epoch 121/200, Loss: 0.0897833989425139
0.6572381535935181
Epoch 131/200, Loss: 0.0899395915594968
0.6527900185302566
Epoch 141/200, Loss: 0.08974973947712869
0.658759832718393
Epoch 151/200, Loss: 0.09003105037140124
0.6616069106394153
Epoch 161/200, Loss: 0.0898955911397934
0.661896168868598
E

[I 2024-01-21 00:53:40,217] Trial 33 finished with value: 0.6624942446523087 and parameters: {'hidden_dim_h': 32, 'dropout': 0.06887967051886412, 'batch_size': 618}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.7336833404034984
0.5736544955362592
Epoch 11/200, Loss: 0.5371634272896514
0.6178926783494848
Epoch 21/200, Loss: 0.1856161726980793
0.6381071956401997
Epoch 31/200, Loss: 0.12516335808500953
0.6492861950695377
Epoch 41/200, Loss: 0.11751663745666037
0.6475117059622575
Epoch 51/200, Loss: 0.11208425538272274
0.6556432807387785
Epoch 61/200, Loss: 0.10803635813752
0.652606155168107
Epoch 71/200, Loss: 0.1040811368397304
0.6556881689146359
Epoch 81/200, Loss: 0.10016055618013654
0.6563864620590066
Epoch 91/200, Loss: 0.09663762152194977
0.6567545697759268
Epoch 101/200, Loss: 0.09427909492229929
0.6584608991710005
Epoch 111/200, Loss: 0.0925822942232599
0.6585403032070727
Epoch 121/200, Loss: 0.09173709473439626
0.6588481614326918
Epoch 131/200, Loss: 0.09111409056551602
0.6556940079087803
Epoch 141/200, Loss: 0.09034746687631218
0.6607302679114389
Epoch 151/200, Loss: 0.09028791210481099
0.6608309500387561
Epoch 161/200, Loss: 0.09010370911992326
0.661326433103724
E

[I 2024-01-21 00:54:36,371] Trial 34 finished with value: 0.661326433103724 and parameters: {'hidden_dim_h': 43, 'dropout': 0.06789059003682493, 'batch_size': 415}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.6046246279749954
0.6010888068551228
Epoch 11/200, Loss: 0.2122362548844856
0.6457146994562207
Epoch 21/200, Loss: 0.17844515463762117
0.6475828926785193
Epoch 31/200, Loss: 0.1502288255775184
0.6506721470948577
Epoch 41/200, Loss: 0.12647551128215956
0.6505406550423245
Epoch 51/200, Loss: 0.10972084719360921
0.6536581691029412
Epoch 61/200, Loss: 0.09963230697209374
0.6493869288792908
Epoch 71/200, Loss: 0.09485205014546712
0.6550275925363348
Epoch 81/200, Loss: 0.09312934206243147
0.6575065599990477
Epoch 91/200, Loss: 0.09185070936617099
0.6580392000232171
Epoch 101/200, Loss: 0.09130936076766566
0.6595926757834332
Epoch 111/200, Loss: 0.09165570571234352
0.6580030264483571
Epoch 121/200, Loss: 0.0917435440055111
0.6615930811283464
Epoch 131/200, Loss: 0.09112910246639921
0.6548449805650843
Epoch 141/200, Loss: 0.09082788542697304
0.6585035765393451
Epoch 151/200, Loss: 0.09119777316064165
0.66348778581182
Epoch 161/200, Loss: 0.09057160035560005
0.65903222762726

[I 2024-01-21 00:55:36,272] Trial 35 finished with value: 0.66348778581182 and parameters: {'hidden_dim_h': 48, 'dropout': 0.12151352057074247, 'batch_size': 351}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.9388635545163542
0.5638051539214888
Epoch 11/200, Loss: 0.8346528588114558
0.6109673838931482
Epoch 21/200, Loss: 0.3439708295706156
0.6334711343303031
Epoch 31/200, Loss: 0.17016987663668556
0.644503042309504
Epoch 41/200, Loss: 0.12632445004340764
0.6487191775638517
Epoch 51/200, Loss: 0.11834757593837944
0.6513085370948919
Epoch 61/200, Loss: 0.11519401258713491
0.6564584793316899
Epoch 71/200, Loss: 0.11129829428485923
0.6546410767740629
Epoch 81/200, Loss: 0.10795922315603979
0.6595781931183035
Epoch 91/200, Loss: 0.10633357171271299
0.656918075630435
Epoch 101/200, Loss: 0.10355862834163614
0.6545545186397155
Epoch 111/200, Loss: 0.09902815822813962
0.661008648205696
Epoch 121/200, Loss: 0.09800941195036914
0.6512657398886801
Epoch 131/200, Loss: 0.09565523025151845
0.6561604622241906
Epoch 141/200, Loss: 0.09399613053412051
0.6562253269644559
Epoch 151/200, Loss: 0.09239224263945141
0.6598842424335873
Epoch 161/200, Loss: 0.09204122544945897
0.65875243574377

[I 2024-01-21 00:56:27,581] Trial 36 finished with value: 0.661008648205696 and parameters: {'hidden_dim_h': 40, 'dropout': 0.14343209078466923, 'batch_size': 554}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.3123981894358345
0.584840832988326
Epoch 11/200, Loss: 0.1727222252799117
0.6482674756228756
Epoch 21/200, Loss: 0.14423949708757194
0.6491174253531049
Epoch 31/200, Loss: 0.12227944495237392
0.6494914495008586
Epoch 41/200, Loss: 0.1092064234873523
0.6454543877142671
Epoch 51/200, Loss: 0.09928197899590367
0.6495132843917979
Epoch 61/200, Loss: 0.09657298935496289
0.652523180085709
Epoch 71/200, Loss: 0.09413850987735002
0.6510467621561956
Epoch 81/200, Loss: 0.09364729763373085
0.6586804006579584
Epoch 91/200, Loss: 0.09353537533594214
0.6597246811974106
Epoch 101/200, Loss: 0.09605277718409248
0.6556996128852132
Epoch 111/200, Loss: 0.0917245014368192
0.6560413729138297
Epoch 121/200, Loss: 0.09503557614010313
0.6626654542888163
Epoch 131/200, Loss: 0.09098988512287969
0.6593097294292534
Epoch 141/200, Loss: 0.09216330767325732
0.6579245166465668
Epoch 151/200, Loss: 0.09165334183236827
0.660590293595608
Epoch 161/200, Loss: 0.09127601122726565
0.659001007652812

[I 2024-01-21 00:57:17,676] Trial 37 finished with value: 0.6639426757595589 and parameters: {'hidden_dim_h': 31, 'dropout': 0.21799635213893623, 'batch_size': 444}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.3925749712130603
0.5729308274795044
Epoch 11/200, Loss: 0.2076065207228941
0.6399844341088294
Epoch 21/200, Loss: 0.15215974344926722
0.6480811481895302
Epoch 31/200, Loss: 0.13851746741463156
0.6481645870927357
Epoch 41/200, Loss: 0.13329004671643763
0.6575695298812314
Epoch 51/200, Loss: 0.12889288979418137
0.6565805083272184
Epoch 61/200, Loss: 0.12466505695791806
0.6506494212287557
Epoch 71/200, Loss: 0.12047384065740249
0.6592811093367958
Epoch 81/200, Loss: 0.11635037248625475
0.6550833174275075
Epoch 91/200, Loss: 0.11234080966781168
0.6591972715304453
Epoch 101/200, Loss: 0.10891684057081447
0.6530039365846866
Epoch 111/200, Loss: 0.10555575919501922
0.6588208466634271
Epoch 121/200, Loss: 0.10275056300794377
0.6587953561347695
Epoch 131/200, Loss: 0.09968580743845772
0.6572781485507047
Epoch 141/200, Loss: 0.09768006249385722
0.6609729603000168
Epoch 151/200, Loss: 0.09615307169802048
0.6616991001851624
Epoch 161/200, Loss: 0.09392970011514776
0.6616081711

[I 2024-01-21 00:58:03,316] Trial 38 finished with value: 0.6622571601524879 and parameters: {'hidden_dim_h': 28, 'dropout': 0.08535619834972658, 'batch_size': 1178}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.689377946120042
0.006124380094287178
Epoch 11/200, Loss: 0.1559083240536543
0.6329962397825475
Epoch 21/200, Loss: 0.12764270328558408
0.6507958266223739
Epoch 31/200, Loss: 0.10953337085934786
0.6511359996128716
Epoch 41/200, Loss: 0.0973265294272166
0.6533123697851274
Epoch 51/200, Loss: 0.09310114968281526
0.6527385177484424
Epoch 61/200, Loss: 0.09185352099056428
0.6586300832164209
Epoch 71/200, Loss: 0.092193864687131
0.6586499173549164
Epoch 81/200, Loss: 0.09204997586516234
0.6548960057015873
Epoch 91/200, Loss: 0.09168461844898187
0.6574949487913337
Epoch 101/200, Loss: 0.09158141549963217
0.6565181962428668
Epoch 111/200, Loss: 0.09111315310001374
0.6582213333001646
Epoch 121/200, Loss: 0.0910470387683465
0.6599529374856727
Epoch 131/200, Loss: 0.09155042016735444
0.658880380866542
Epoch 141/200, Loss: 0.09129474254754874
0.6601356641468906
Epoch 151/200, Loss: 0.09165882989764214
0.656277511131218
Epoch 161/200, Loss: 0.09144118113013414
0.658169068078455

[I 2024-01-21 00:59:22,914] Trial 39 finished with value: 0.6626044099187203 and parameters: {'hidden_dim_h': 19, 'dropout': 0.05053358042914421, 'batch_size': 154}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.3573433041572571
0.5711565874427887
Epoch 11/200, Loss: 0.6627955098946889
0.6182641534178577
Epoch 21/200, Loss: 0.3686807870864868
0.6386702771008064
Epoch 31/200, Loss: 0.2675357560316722
0.6407784892506768
Epoch 41/200, Loss: 0.23674005667368572
0.6452236802179429
Epoch 51/200, Loss: 0.22073793808619183
0.6484531289082145
Epoch 61/200, Loss: 0.20651719669500987
0.6474705454612835
Epoch 71/200, Loss: 0.19211032291253408
0.642925573181756
Epoch 81/200, Loss: 0.17745494991540908
0.6497914864672073
Epoch 91/200, Loss: 0.16272933532794318
0.6481136023469032
Epoch 101/200, Loss: 0.14914352943499884
0.6533653067311289
Epoch 111/200, Loss: 0.13684213409821191
0.6523819872765829
Epoch 121/200, Loss: 0.1257300299902757
0.6507114251774844
Epoch 131/200, Loss: 0.11656925231218337
0.6485581890011333
Epoch 141/200, Loss: 0.108849319567283
0.6516831324079244
Epoch 151/200, Loss: 0.10283042192459106
0.6531592055838215
Epoch 161/200, Loss: 0.09850246012210846
0.6533457299108135

[I 2024-01-21 01:00:15,837] Trial 40 finished with value: 0.6578466553742527 and parameters: {'hidden_dim_h': 47, 'dropout': 0.0938448759548745, 'batch_size': 676}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.923232918748489
0.5830337475635011
Epoch 11/200, Loss: 0.23317077899208435
0.5999795824292579
Epoch 21/200, Loss: 0.15458823955402926
0.6262983252298192
Epoch 31/200, Loss: 0.13599155520877013
0.6277756617704713
Epoch 41/200, Loss: 0.11727724861926757
0.6444964705333968
Epoch 51/200, Loss: 0.1045911440339226
0.6400793564966786
Epoch 61/200, Loss: 0.09821542538702488
0.6535711634860171
Epoch 71/200, Loss: 0.09614388988568233
0.6499679108659
Epoch 81/200, Loss: 0.09669136263143557
0.6481317126143413
Epoch 91/200, Loss: 0.09492921786239514
0.6562556577666708
Epoch 101/200, Loss: 0.09561358657307349
0.6512487980123116
Epoch 111/200, Loss: 0.09555798697356994
0.653747337922309
Epoch 121/200, Loss: 0.094788305927068
0.6530228203751942
Epoch 131/200, Loss: 0.09497726887751085
0.6603366509597274
Epoch 141/200, Loss: 0.09461528607285939
0.6569144263921619
Epoch 151/200, Loss: 0.0939582136208908
0.6523006927899428
Epoch 161/200, Loss: 0.09471907950221346
0.6557871099592822
E

[I 2024-01-21 01:01:31,809] Trial 41 finished with value: 0.6603366509597274 and parameters: {'hidden_dim_h': 50, 'dropout': 0.11083142256151271, 'batch_size': 194}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.494804174524464
0.5924624828189489
Epoch 11/200, Loss: 0.23365966506200295
0.6391776426722843
Epoch 21/200, Loss: 0.173140918555325
0.6402680628054314
Epoch 31/200, Loss: 0.12973994822943047
0.6502134815489542
Epoch 41/200, Loss: 0.10602537042474093
0.6506288330948565
Epoch 51/200, Loss: 0.09673361347554481
0.6477782723426927
Epoch 61/200, Loss: 0.09311285778267743
0.6513187297302205
Epoch 71/200, Loss: 0.09290472254769443
0.6524341969388382
Epoch 81/200, Loss: 0.09199974287862647
0.6564046120469395
Epoch 91/200, Loss: 0.09188895448021693
0.6596986481690469
Epoch 101/200, Loss: 0.0919231238634619
0.6594612102654223
Epoch 111/200, Loss: 0.09149127269852651
0.6600276217774754
Epoch 121/200, Loss: 0.09150773368469656
0.6568225653741198
Epoch 131/200, Loss: 0.0914719015972255
0.662024273263064
Epoch 141/200, Loss: 0.09150299093086425
0.6612947020134801
Epoch 151/200, Loss: 0.09120964789635515
0.661399259105298
Epoch 161/200, Loss: 0.09118235754231883
0.6598415201844122

[I 2024-01-21 01:02:40,018] Trial 42 finished with value: 0.662024273263064 and parameters: {'hidden_dim_h': 50, 'dropout': 0.1262717194514617, 'batch_size': 275}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.3830198178104326
0.5989811606982177
Epoch 11/200, Loss: 0.190253396482006
0.6247968655445446
Epoch 21/200, Loss: 0.12354676264758203
0.6429773402233474
Epoch 31/200, Loss: 0.10116915514363962
0.6529664550717672
Epoch 41/200, Loss: 0.09489292308103804
0.6538216713819416
Epoch 51/200, Loss: 0.09306035921269772
0.654497291394846
Epoch 61/200, Loss: 0.09506232254937583
0.6559377979019009
Epoch 71/200, Loss: 0.09073339210932746
0.6538460440159517
Epoch 81/200, Loss: 0.09156127149860065
0.6613335756397434
Epoch 91/200, Loss: 0.09452375608916376
0.6484717561277761
Epoch 101/200, Loss: 0.0911586860413937
0.65853994318947
Epoch 111/200, Loss: 0.09378255618845716
0.6568891204264197
Epoch 121/200, Loss: 0.09210231220897507
0.6570652783970747
Epoch 131/200, Loss: 0.09178707533169027
0.652424601443952
Epoch 141/200, Loss: 0.09267943301329426
0.6571764825927957
Epoch 151/200, Loss: 0.09113270519118682
0.6569383816076393
Epoch 161/200, Loss: 0.09105516210490582
0.6583276273046494

[I 2024-01-21 01:03:52,341] Trial 43 finished with value: 0.6613335756397434 and parameters: {'hidden_dim_h': 44, 'dropout': 0.0634722263321642, 'batch_size': 198}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.575057913118334
0.5698698859514416
Epoch 11/200, Loss: 0.14264875567003862
0.6234157782093679
Epoch 21/200, Loss: 0.12264427186837837
0.6264044566548254
Epoch 31/200, Loss: 0.11110539912287869
0.6357246160175668
Epoch 41/200, Loss: 0.10397752808101142
0.6341071733671395
Epoch 51/200, Loss: 0.10228401339098589
0.6314175054871647
Epoch 61/200, Loss: 0.10272238431359405
0.6287267421276613
Epoch 71/200, Loss: 0.10360222598954813
0.6308663834420882
Epoch 81/200, Loss: 0.10402091620350952
0.6307439481004977
Epoch 91/200, Loss: 0.10356901235767264
0.6291098451354722
Epoch 101/200, Loss: 0.1036640507961387
0.630385543941264
Epoch 111/200, Loss: 0.10513112677344635
0.6243676739269328
Epoch 121/200, Loss: 0.10474526793209475
0.6243815242696679
Epoch 131/200, Loss: 0.10444066295428063
0.6266991669691978
Epoch 141/200, Loss: 0.1049268860091914
0.6264196797782496
Epoch 151/200, Loss: 0.1050194207189688
0.6238732746516078
Epoch 161/200, Loss: 0.10498484641091148
0.62326537211706

[I 2024-01-21 01:05:16,789] Trial 44 finished with value: 0.6357246160175668 and parameters: {'hidden_dim_h': 48, 'dropout': 0.07676675366852492, 'batch_size': 150}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.5339819888273876
0.5805758299710262
Epoch 11/200, Loss: 0.3136029483543502
0.6060350985697085
Epoch 21/200, Loss: 0.1719029845876826
0.6328250985264334
Epoch 31/200, Loss: 0.1540554774304231
0.6388453801199782
Epoch 41/200, Loss: 0.13709247836636174
0.6437507252514921
Epoch 51/200, Loss: 0.12011758382949564
0.642900598781979
Epoch 61/200, Loss: 0.10737478101832999
0.6478900129486154
Epoch 71/200, Loss: 0.09963520181675752
0.6563386420239677
Epoch 81/200, Loss: 0.09516939355267419
0.6561932490778165
Epoch 91/200, Loss: 0.09410237034575807
0.6533065871833733
Epoch 101/200, Loss: 0.09348996314737532
0.6555589593876461
Epoch 111/200, Loss: 0.09295213325983948
0.659104421625779
Epoch 121/200, Loss: 0.09227780583831999
0.6578928801587945
Epoch 131/200, Loss: 0.09317880496382713
0.6573347696671119
Epoch 141/200, Loss: 0.09244392450071043
0.6549490837708706
Epoch 151/200, Loss: 0.0931596357582344
0.6601536016852846
Epoch 161/200, Loss: 0.09261456380287807
0.658203832920198

[I 2024-01-21 01:06:21,309] Trial 45 finished with value: 0.6601536016852846 and parameters: {'hidden_dim_h': 41, 'dropout': 0.10055943206784788, 'batch_size': 281}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.2398184218576976
0.593677987412103
Epoch 11/200, Loss: 0.11078854928632359
0.6449177028551375
Epoch 21/200, Loss: 0.09981964217437493
0.6513429876177874
Epoch 31/200, Loss: 0.09447653751288142
0.6594456570302838
Epoch 41/200, Loss: 0.09347460173316054
0.652733508872808
Epoch 51/200, Loss: 0.09219446671860558
0.6589715607639888
Epoch 61/200, Loss: 0.09298660426021932
0.6492006204062486
Epoch 71/200, Loss: 0.0937276894410888
0.6531069191598934
Epoch 81/200, Loss: 0.09174695316251817
0.6565943920036738
Epoch 91/200, Loss: 0.09143511476097527
0.6571749712024545
Epoch 101/200, Loss: 0.09152343893771643
0.6574383961232376
Epoch 111/200, Loss: 0.09164822543715383
0.6569647537222079
Epoch 121/200, Loss: 0.09139165192187487
0.6606440844290452
Epoch 131/200, Loss: 0.09257232463294333
0.6556319089846886
Epoch 141/200, Loss: 0.09198442085103674
0.659244027324707
Epoch 151/200, Loss: 0.09154076252009842
0.6598808786630284
Epoch 161/200, Loss: 0.09136492685302273
0.6592648058839

[I 2024-01-21 01:07:27,658] Trial 46 finished with value: 0.6606440844290452 and parameters: {'hidden_dim_h': 38, 'dropout': 0.1163709363905121, 'batch_size': 222}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 2.1166732140949795
0.5639819442223893
Epoch 11/200, Loss: 0.722831095967974
0.6188272895410107
Epoch 21/200, Loss: 0.28131433443299364
0.6164655484578502
Epoch 31/200, Loss: 0.19108092545398644
0.6366233518120018
Epoch 41/200, Loss: 0.17341579044503824
0.6412362530028172
Epoch 51/200, Loss: 0.15836150784577643
0.6436165048297926
Epoch 61/200, Loss: 0.14215846279902117
0.6529555960408951
Epoch 71/200, Loss: 0.12665523455611297
0.6490487627189784
Epoch 81/200, Loss: 0.11414282582700253
0.6482156218857069
Epoch 91/200, Loss: 0.10440672588135515
0.6490851965720882
Epoch 101/200, Loss: 0.0985162824924503
0.6540862971166974
Epoch 111/200, Loss: 0.09434398729354143
0.6554856148767603
Epoch 121/200, Loss: 0.09269286798579353
0.6539311480236387
Epoch 131/200, Loss: 0.0927654096324529
0.6580631210337704
Epoch 141/200, Loss: 0.09208415089441198
0.6531921426143948
Epoch 151/200, Loss: 0.09202265899096217
0.6595785027646307
Epoch 161/200, Loss: 0.09145820659718343
0.6561912796204

[I 2024-01-21 01:08:29,044] Trial 47 finished with value: 0.6595785027646307 and parameters: {'hidden_dim_h': 49, 'dropout': 0.13195054420358499, 'batch_size': 362}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.5221870727377174
0.5966538125025685
Epoch 11/200, Loss: 0.1849889349606302
0.6292421822954873
Epoch 21/200, Loss: 0.11066111991250957
0.6351993883008055
Epoch 31/200, Loss: 0.09657010509644026
0.6478898385653419
Epoch 41/200, Loss: 0.09505199259262026
0.6530861594891957
Epoch 51/200, Loss: 0.09429386922698697
0.660668416421922
Epoch 61/200, Loss: 0.09413217399039386
0.6525816091954598
Epoch 71/200, Loss: 0.09410891042631349
0.6489068570938441
Epoch 81/200, Loss: 0.09312532021215668
0.6572569669151573
Epoch 91/200, Loss: 0.09350552938786554
0.6532762792338794
Epoch 101/200, Loss: 0.09267390185944092
0.6579499369725814
Epoch 111/200, Loss: 0.09279717843013781
0.65689300137738
Epoch 121/200, Loss: 0.09347819385153276
0.6529734993808658
Epoch 131/200, Loss: 0.09278922946548757
0.6539215155496564
Epoch 141/200, Loss: 0.09331723215219415
0.6589918811904315
Epoch 151/200, Loss: 0.09229587163362238
0.6581997109622295
Epoch 161/200, Loss: 0.09298812110482911
0.6560329824174

[I 2024-01-21 01:10:05,390] Trial 48 finished with value: 0.6611467488871683 and parameters: {'hidden_dim_h': 46, 'dropout': 0.14814016429557592, 'batch_size': 124}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.6031671600826716
0.5647336746159657
Epoch 11/200, Loss: 0.38260659272387876
0.6034188273022503
Epoch 21/200, Loss: 0.16615208756115477
0.6332030624461963
Epoch 31/200, Loss: 0.14471279425641237
0.639910140393766
Epoch 41/200, Loss: 0.13475561899653934
0.6475623399302279
Epoch 51/200, Loss: 0.12456194109330743
0.6514057897545555
Epoch 61/200, Loss: 0.11461441117828175
0.6568215693218958
Epoch 71/200, Loss: 0.10585476811659539
0.656215031630207
Epoch 81/200, Loss: 0.09963307605456498
0.6570619505432879
Epoch 91/200, Loss: 0.09605362720913806
0.6540201546141662
Epoch 101/200, Loss: 0.0940753941313695
0.6537247472791434
Epoch 111/200, Loss: 0.09340759227841587
0.6595390452726712
Epoch 121/200, Loss: 0.0933821043473179
0.6597121233215112
Epoch 131/200, Loss: 0.09272865344912319
0.6597786550300379
Epoch 141/200, Loss: 0.09237457975997763
0.6591123327155112
Epoch 151/200, Loss: 0.09287540677745464
0.6616211463284686
Epoch 161/200, Loss: 0.09237852907281811
0.6601966550189

[I 2024-01-21 01:10:58,731] Trial 49 finished with value: 0.6616211463284686 and parameters: {'hidden_dim_h': 16, 'dropout': 0.17744325290910806, 'batch_size': 343}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.706207883854707
0.5612027678935106
Epoch 11/200, Loss: 0.6166024419168631
0.6250310648709939
Epoch 21/200, Loss: 0.3162616652746995
0.6401016551920609
Epoch 31/200, Loss: 0.25748640081534785
0.6481661280143058
Epoch 41/200, Loss: 0.23238321642080942
0.644971440751244
Epoch 51/200, Loss: 0.20759741651515165
0.6450679435388521
Epoch 61/200, Loss: 0.18237218260765076
0.6418325948183562
Epoch 71/200, Loss: 0.15833015770961842
0.6452124434416455
Epoch 81/200, Loss: 0.13739185112838945
0.6493295372036493
Epoch 91/200, Loss: 0.11994829851513107
0.6514644912900828
Epoch 101/200, Loss: 0.10801780953382452
0.6505006032357331
Epoch 111/200, Loss: 0.09985284848759572
0.6434331596768855
Epoch 121/200, Loss: 0.09505950349072616
0.6591065875705379
Epoch 131/200, Loss: 0.09237205951164167
0.6552727452426603
Epoch 141/200, Loss: 0.09114653120438258
0.6563458666192562
Epoch 151/200, Loss: 0.09086825807268421
0.6599015889515524
Epoch 161/200, Loss: 0.0904372027143836
0.65928827670235

[I 2024-01-21 01:11:54,915] Trial 50 finished with value: 0.6630407739514899 and parameters: {'hidden_dim_h': 45, 'dropout': 0.09746758108130385, 'batch_size': 418}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.418580182393392
0.5774309812919158
Epoch 11/200, Loss: 0.45051982005437213
0.6292105526674353
Epoch 21/200, Loss: 0.18438729014661576
0.6409902188386966
Epoch 31/200, Loss: 0.1400639643271764
0.6489455149965522
Epoch 41/200, Loss: 0.132108806570371
0.6535671003091442
Epoch 51/200, Loss: 0.1259926935036977
0.6564005463300816
Epoch 61/200, Loss: 0.11943885650899676
0.652880374934646
Epoch 71/200, Loss: 0.11334341019392014
0.6564814893697277
Epoch 81/200, Loss: 0.1071564667754703
0.6549537281174792
Epoch 91/200, Loss: 0.10246729287836287
0.659076963934319
Epoch 101/200, Loss: 0.09831155488888423
0.6585528399000761
Epoch 111/200, Loss: 0.09579872737328211
0.6552128792321831
Epoch 121/200, Loss: 0.09333190669616064
0.6567399687660649
Epoch 131/200, Loss: 0.09238286680645413
0.6591887073575031
Epoch 141/200, Loss: 0.09209133601850933
0.6604805120279982
Epoch 151/200, Loss: 0.09179853813515769
0.6583800224744925
Epoch 161/200, Loss: 0.09159674412674373
0.6609116133010661


[I 2024-01-21 01:12:44,620] Trial 51 finished with value: 0.6634488292374645 and parameters: {'hidden_dim_h': 31, 'dropout': 0.22634204595040813, 'batch_size': 447}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.6684928689061141
0.5895293358890888
Epoch 11/200, Loss: 0.22537846136383893
0.6462395002880388
Epoch 21/200, Loss: 0.17614341127436337
0.6492840944360272
Epoch 31/200, Loss: 0.13514280346472088
0.6478523488759608
Epoch 41/200, Loss: 0.10923523028812758
0.6495572181169016
Epoch 51/200, Loss: 0.09816049520925778
0.6499999520755313
Epoch 61/200, Loss: 0.09443476114694666
0.6517286992849701
Epoch 71/200, Loss: 0.09360299241252062
0.6586546897543414
Epoch 81/200, Loss: 0.09285262681362105
0.6611378969309337
Epoch 91/200, Loss: 0.09305914073455625
0.659298510763847
Epoch 101/200, Loss: 0.09231457641211951
0.6581114289159631
Epoch 111/200, Loss: 0.09244072128359865
0.6574268026972324
Epoch 121/200, Loss: 0.09248658224213414
0.6602273990081668
Epoch 131/200, Loss: 0.09228432623714936
0.662611386304804
Epoch 141/200, Loss: 0.09207917268319828
0.6591905096444687
Epoch 151/200, Loss: 0.09236174676476455
0.6613592428515003
Epoch 161/200, Loss: 0.09192078378869266
0.65871793631

[I 2024-01-21 01:13:47,917] Trial 52 finished with value: 0.662611386304804 and parameters: {'hidden_dim_h': 25, 'dropout': 0.22730035096477588, 'batch_size': 245}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 2.274783631758903
0.5687897434692443
Epoch 11/200, Loss: 0.6602598606650509
0.38319214094943205
Epoch 21/200, Loss: 0.20960097837803968
0.6317992474047929
Epoch 31/200, Loss: 0.1645251185591541
0.6388587064716018
Epoch 41/200, Loss: 0.14892374646307818
0.6466727519263437
Epoch 51/200, Loss: 0.1366508581967496
0.648842545769424
Epoch 61/200, Loss: 0.12066946067472002
0.6478359733068595
Epoch 71/200, Loss: 0.1129605107343019
0.6538164081104354
Epoch 81/200, Loss: 0.10216321618254505
0.6567318059528086
Epoch 91/200, Loss: 0.0959383000188799
0.6527247993530938
Epoch 101/200, Loss: 0.09896927449240614
0.6563323047124808
Epoch 111/200, Loss: 0.09257485167081676
0.6590023519353223
Epoch 121/200, Loss: 0.09400288304731028
0.6584786620455199
Epoch 131/200, Loss: 0.09267386043472077
0.6556951543285041
Epoch 141/200, Loss: 0.09121947154513936
0.6527458919036255
Epoch 151/200, Loss: 0.09743405778461428
0.6603857715863561
Epoch 161/200, Loss: 0.09479397001551158
0.659123414026077

[I 2024-01-21 01:14:46,010] Trial 53 finished with value: 0.6603857715863561 and parameters: {'hidden_dim_h': 29, 'dropout': 0.21007261244270511, 'batch_size': 303}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.9997177010171869
0.5826331933046066
Epoch 11/200, Loss: 0.16279973826381597
0.6400500246296911
Epoch 21/200, Loss: 0.13502127133058697
0.650221671450511
Epoch 31/200, Loss: 0.12042595069395022
0.6468113404565655
Epoch 41/200, Loss: 0.10667312605662292
0.6542768266487189
Epoch 51/200, Loss: 0.09846836269906398
0.6593602231324918
Epoch 61/200, Loss: 0.09496086835861206
0.6569902868112659
Epoch 71/200, Loss: 0.09317683512240313
0.6584483343299269
Epoch 81/200, Loss: 0.09254304227534305
0.65811959765776
Epoch 91/200, Loss: 0.09277651994750741
0.6570340953686234
Epoch 101/200, Loss: 0.09257894921838568
0.6586621847486229
Epoch 111/200, Loss: 0.09305041074083092
0.6603389538438161
Epoch 121/200, Loss: 0.09197936809799645
0.6618152161718465
Epoch 131/200, Loss: 0.09172565682550494
0.6588439067339499
Epoch 141/200, Loss: 0.09224896727318174
0.6578256947222034
Epoch 151/200, Loss: 0.0927436916848247
0.6597986277243382
Epoch 161/200, Loss: 0.09273373184914
0.660151844312008


[I 2024-01-21 01:15:51,655] Trial 54 finished with value: 0.6618152161718465 and parameters: {'hidden_dim_h': 22, 'dropout': 0.2027327583642491, 'batch_size': 227}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.2540204966207966
0.603139958296499
Epoch 11/200, Loss: 0.1347761208890006
0.6416391922312092
Epoch 21/200, Loss: 0.10406002757372335
0.6467321816978674
Epoch 31/200, Loss: 0.09730713453609496
0.6524570050666165
Epoch 41/200, Loss: 0.09563212317880243
0.6572206164232459
Epoch 51/200, Loss: 0.0949816849315539
0.6526715770208359
Epoch 61/200, Loss: 0.09489418257726356
0.6581224891082202
Epoch 71/200, Loss: 0.09469266713131219
0.6549806228421704
Epoch 81/200, Loss: 0.09474793230765499
0.6547131495392969
Epoch 91/200, Loss: 0.09415784291923046
0.6587297494662601
Epoch 101/200, Loss: 0.09467669995501637
0.6557461970516343
Epoch 111/200, Loss: 0.09420528617920354
0.6578229255247855
Epoch 121/200, Loss: 0.09416971006430686
0.6612728929360909
Epoch 131/200, Loss: 0.09412914188578725
0.658693948215316
Epoch 141/200, Loss: 0.09322066471213475
0.6570875201196612
Epoch 151/200, Loss: 0.09455267590237781
0.655687160601441
Epoch 161/200, Loss: 0.09344269020948559
0.66051802706262

[I 2024-01-21 01:17:11,953] Trial 55 finished with value: 0.6612728929360909 and parameters: {'hidden_dim_h': 39, 'dropout': 0.2720808121230696, 'batch_size': 157}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 1.0585350995570157
0.5805116754304448
Epoch 11/200, Loss: 0.14464446269305406
0.6347657312350147
Epoch 21/200, Loss: 0.12554315635852054
0.651413554895616
Epoch 31/200, Loss: 0.10919642026445507
0.648079550189587
Epoch 41/200, Loss: 0.09920792584925626
0.6492482085053762
Epoch 51/200, Loss: 0.09558411509589812
0.6530930420109995
Epoch 61/200, Loss: 0.09444767091654044
0.654877650283696
Epoch 71/200, Loss: 0.09362394929723403
0.6552522888184552
Epoch 81/200, Loss: 0.09389714850524886
0.6555286124092561
Epoch 91/200, Loss: 0.0937367416588606
0.653107568558317
Epoch 101/200, Loss: 0.09364189167993259
0.6561547800222065
Epoch 111/200, Loss: 0.0940652254276571
0.653534243861236
Epoch 121/200, Loss: 0.09334181301889166
0.6606449050130493
Epoch 131/200, Loss: 0.0934758071284906
0.6597513737402791
Epoch 141/200, Loss: 0.09322924951536465
0.6563030794384441
Epoch 151/200, Loss: 0.09314061074921515
0.6551103509082357
Epoch 161/200, Loss: 0.09357245906000644
0.6590095026083401


[I 2024-01-21 01:18:25,998] Trial 56 finished with value: 0.6606449050130493 and parameters: {'hidden_dim_h': 36, 'dropout': 0.25104096935705544, 'batch_size': 177}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.9033773993292162
0.5811470459689302
Epoch 11/200, Loss: 0.2973910517269565
0.4855709374779051
Epoch 21/200, Loss: 0.2003259269460555
0.635568665612286
Epoch 31/200, Loss: 0.1713316029598636
0.6423723261626896
Epoch 41/200, Loss: 0.14347385639144528
0.6526514702860157
Epoch 51/200, Loss: 0.12138527980254542
0.6411874331334803
Epoch 61/200, Loss: 0.10616866054554139
0.6495396077099017
Epoch 71/200, Loss: 0.09736149878271165
0.6581199387519858
Epoch 81/200, Loss: 0.0931708198641577
0.6582227575819406
Epoch 91/200, Loss: 0.0918328664716213
0.6553691355197573
Epoch 101/200, Loss: 0.09150114859784803
0.652220996307692
Epoch 111/200, Loss: 0.09100799226472454
0.6591081537956961
Epoch 121/200, Loss: 0.0909195460619465
0.6588296443310218
Epoch 131/200, Loss: 0.09093838581635107
0.6578896516012993
Epoch 141/200, Loss: 0.09017590457393278
0.6619433516128423
Epoch 151/200, Loss: 0.09046160874347534
0.6564896006879489
Epoch 161/200, Loss: 0.09058043697187977
0.6568619720027068


[I 2024-01-21 01:19:24,102] Trial 57 finished with value: 0.6619433516128423 and parameters: {'hidden_dim_h': 33, 'dropout': 0.06320094922605343, 'batch_size': 326}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.3496309594780791
0.5908117361182196
Epoch 11/200, Loss: 0.20374067069268695
0.643211757534178
Epoch 21/200, Loss: 0.17086475649300745
0.6477095923319792
Epoch 31/200, Loss: 0.1412749451165106
0.6503726788795439
Epoch 41/200, Loss: 0.11977880608801748
0.6545494309413074
Epoch 51/200, Loss: 0.1056527165221233
0.6572665898273619
Epoch 61/200, Loss: 0.09764005083079431
0.6581996023942589
Epoch 71/200, Loss: 0.09438008274517808
0.6598746093098612
Epoch 81/200, Loss: 0.09238351866895077
0.6552764269633765
Epoch 91/200, Loss: 0.09137318414800308
0.6626530324160261
Epoch 101/200, Loss: 0.0913698690779069
0.6629798719773192
Epoch 111/200, Loss: 0.09138331781415378
0.6603154900924286
Epoch 121/200, Loss: 0.09125879348493089
0.6595958907818107
Epoch 131/200, Loss: 0.09187748458455591
0.6611444424603664
Epoch 141/200, Loss: 0.09109912374440361
0.6585883798671172
Epoch 151/200, Loss: 0.09081252708154566
0.6585384640308548
Epoch 161/200, Loss: 0.0911487256195031
0.65970431143611

[I 2024-01-21 01:20:14,075] Trial 58 finished with value: 0.6629798719773192 and parameters: {'hidden_dim_h': 22, 'dropout': 0.18491669694308688, 'batch_size': 397}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.6641053274348753
0.5829714576130544
Epoch 11/200, Loss: 0.11555512698750998
0.6344963642366354
Epoch 21/200, Loss: 0.1012447745206967
0.6364756681926456
Epoch 31/200, Loss: 0.09796327030538914
0.6472913418554734
Epoch 41/200, Loss: 0.1002577843153896
0.6520418369483022
Epoch 51/200, Loss: 0.09702678754850848
0.6539072018777083
Epoch 61/200, Loss: 0.09496426863137201
0.6547480078389878
Epoch 71/200, Loss: 0.09823670369296816
0.6495940960440513
Epoch 81/200, Loss: 0.09782180440935058
0.6540887178443408
Epoch 91/200, Loss: 0.09471194857928023
0.6512129956974081
Epoch 101/200, Loss: 0.09466338554518906
0.6488284086069065
Epoch 111/200, Loss: 0.09746259458400497
0.656208504889275
Epoch 121/200, Loss: 0.09505477547645569
0.6582761004701377
Epoch 131/200, Loss: 0.09638778859721356
0.6518741037788188
Epoch 141/200, Loss: 0.09565461782654326
0.6551294330234415
Epoch 151/200, Loss: 0.09472002652497148
0.6538659235103842
Epoch 161/200, Loss: 0.09521227622002214
0.655053415981

[I 2024-01-21 01:22:07,417] Trial 59 finished with value: 0.6582761004701377 and parameters: {'hidden_dim_h': 47, 'dropout': 0.07368735879185534, 'batch_size': 101}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.36672692994276684
0.5806541955316825
Epoch 11/200, Loss: 0.18797696097975686
0.6425254629230366
Epoch 21/200, Loss: 0.16294964864140465
0.6430839504933138
Epoch 31/200, Loss: 0.1392937476436297
0.6444463815349044
Epoch 41/200, Loss: 0.12135424784251622
0.648934874146338
Epoch 51/200, Loss: 0.10893087408372334
0.6510224578428881
Epoch 61/200, Loss: 0.10070786642886344
0.6557988139548364
Epoch 71/200, Loss: 0.09648657749806132
0.6538596899775467
Epoch 81/200, Loss: 0.09534931342516627
0.6571161502870372
Epoch 91/200, Loss: 0.09449355925122897
0.6581616223742399
Epoch 101/200, Loss: 0.09404642791265533
0.6536375839971617
Epoch 111/200, Loss: 0.0933440513908863
0.6557602871770881
Epoch 121/200, Loss: 0.09328835297908102
0.6569472433395828
Epoch 131/200, Loss: 0.0928442579294954
0.6604803764867675
Epoch 141/200, Loss: 0.09271735236758277
0.6596560273360058
Epoch 151/200, Loss: 0.09314028776827313
0.6586292769347676
Epoch 161/200, Loss: 0.0924971733419668
0.6605874354526

[I 2024-01-21 01:22:59,606] Trial 60 finished with value: 0.6619213025499039 and parameters: {'hidden_dim_h': 36, 'dropout': 0.3003301219106793, 'batch_size': 486}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.2543695315166756
0.578913953924608
Epoch 11/200, Loss: 0.12722837462745332
0.6518304838072743
Epoch 21/200, Loss: 0.09830212827633929
0.6534879952821148
Epoch 31/200, Loss: 0.09322968428885495
0.6597172619337079
Epoch 41/200, Loss: 0.0924067605562784
0.6603391533319438
Epoch 51/200, Loss: 0.09230233942744909
0.656348770790227
Epoch 61/200, Loss: 0.09168632093954969
0.657261023201668
Epoch 71/200, Loss: 0.09165506258055016
0.6593489493786343
Epoch 81/200, Loss: 0.09151703422820126
0.6578208310139205
Epoch 91/200, Loss: 0.0913692884216154
0.6608416837708128
Epoch 101/200, Loss: 0.0911344887205848
0.6545286310091532
Epoch 111/200, Loss: 0.0906443297173138
0.6598246095152929
Epoch 121/200, Loss: 0.09164786373299581
0.6601536618245242
Epoch 131/200, Loss: 0.0915157252025825
0.6619040266338447
Epoch 141/200, Loss: 0.09082995541393757
0.6619038570073241
Epoch 151/200, Loss: 0.09085011413251912
0.6613466530623988
Epoch 161/200, Loss: 0.09120113809627516
0.6630460963453313


[I 2024-01-21 01:24:09,881] Trial 61 finished with value: 0.6630460963453313 and parameters: {'hidden_dim_h': 10, 'dropout': 0.08769043516835447, 'batch_size': 186}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.8327641181043677
0.5756677709905017
Epoch 11/200, Loss: 0.19732997042907252
0.6288291973021384
Epoch 21/200, Loss: 0.16322651485333572
0.649635995044707
Epoch 31/200, Loss: 0.13773386301221074
0.6506265712889429
Epoch 41/200, Loss: 0.11670475714915507
0.6559196252986055
Epoch 51/200, Loss: 0.10261148395570549
0.6553708688200913
Epoch 61/200, Loss: 0.09551409007729711
0.6589973281889485
Epoch 71/200, Loss: 0.09261583989939175
0.661954511077246
Epoch 81/200, Loss: 0.09171294853896708
0.6590530134621679
Epoch 91/200, Loss: 0.09138678910361754
0.6619201311739651
Epoch 101/200, Loss: 0.09138916825523248
0.6592474508993158
Epoch 111/200, Loss: 0.09128237233774082
0.6626790221203934
Epoch 121/200, Loss: 0.09148527530802263
0.6604455798711956
Epoch 131/200, Loss: 0.09115941580888387
0.6637395857003815
Epoch 141/200, Loss: 0.09033684231139519
0.6611807007310886
Epoch 151/200, Loss: 0.09052970632910728
0.6545490585263328
Epoch 161/200, Loss: 0.09107649940493945
0.66112062189

[I 2024-01-21 01:25:09,698] Trial 62 finished with value: 0.6637395857003815 and parameters: {'hidden_dim_h': 16, 'dropout': 0.1060355112992248, 'batch_size': 272}. Best is trial 11 with value: 0.664822187307751.


Epoch 1/200, Loss: 0.7252618710199992
0.575632542956028
Epoch 11/200, Loss: 0.20739333848158517
0.6407934895648955
Epoch 21/200, Loss: 0.17023743073145547
0.6469034094757414
Epoch 31/200, Loss: 0.13764725774526596
0.6468858817757768
Epoch 41/200, Loss: 0.11384428232908249
0.6540172031838597
Epoch 51/200, Loss: 0.09896984050671259
0.6528634078522033
Epoch 61/200, Loss: 0.09333584815263749
0.6557649968436252
Epoch 71/200, Loss: 0.0914405220746994
0.6611224160148298
Epoch 81/200, Loss: 0.0908486599723498
0.66146620599252
Epoch 91/200, Loss: 0.09038688153028489
0.6628384575956994
Epoch 101/200, Loss: 0.09042621403932571
0.6594190481394927
Epoch 111/200, Loss: 0.0903575712442398
0.6572469377804571
Epoch 121/200, Loss: 0.09035090178251266
0.6586538569448186
Epoch 131/200, Loss: 0.0905501585205396
0.6604558330586633
Epoch 141/200, Loss: 0.09018180867036184
0.6614998801336553
Epoch 151/200, Loss: 0.09005819837252299
0.6611381767282292
Epoch 161/200, Loss: 0.0900293684999148
0.6608168456297041


[I 2024-01-21 01:26:10,093] Trial 63 finished with value: 0.6648751940069384 and parameters: {'hidden_dim_h': 15, 'dropout': 0.06118622949287433, 'batch_size': 267}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.23602194834005583
0.5959861631987283
Epoch 11/200, Loss: 0.1140040594797868
0.6485314780868998
Epoch 21/200, Loss: 0.09482906435753082
0.6504241487124968
Epoch 31/200, Loss: 0.09253307124534688
0.6555744287708194
Epoch 41/200, Loss: 0.09210610155250643
0.6536031086098432
Epoch 51/200, Loss: 0.09233337674628604
0.6569304382789664
Epoch 61/200, Loss: 0.09143438289215515
0.655651018845651
Epoch 71/200, Loss: 0.09185788736164154
0.6580537520645638
Epoch 81/200, Loss: 0.0917752003492592
0.6605150779704638
Epoch 91/200, Loss: 0.0914678760393933
0.6579878565977308
Epoch 101/200, Loss: 0.09169879946466926
0.657847127988667
Epoch 111/200, Loss: 0.09127518399195238
0.656716353448138
Epoch 121/200, Loss: 0.09143707539130758
0.6572546394284704
Epoch 131/200, Loss: 0.09119203019809057
0.6608912512339299
Epoch 141/200, Loss: 0.09122917764670366
0.6559325596505569
Epoch 151/200, Loss: 0.09123943123471487
0.6615944543607613
Epoch 161/200, Loss: 0.09108646589142459
0.65823676686634

[I 2024-01-21 01:27:35,927] Trial 64 finished with value: 0.6615944543607613 and parameters: {'hidden_dim_h': 21, 'dropout': 0.05620484217693346, 'batch_size': 140}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.21936700212699112
0.5867316002858424
Epoch 11/200, Loss: 0.12585449867671536
0.6489033656626169
Epoch 21/200, Loss: 0.09866372335662124
0.6527920210008089
Epoch 31/200, Loss: 0.0925172675521143
0.6566430100893055
Epoch 41/200, Loss: 0.09196797982659391
0.6546101695738338
Epoch 51/200, Loss: 0.09135574518993336
0.6537054280223266
Epoch 61/200, Loss: 0.09079278020128127
0.6603553879005919
Epoch 71/200, Loss: 0.09097433258448878
0.658739477617286
Epoch 81/200, Loss: 0.09136614748226699
0.6625426369248223
Epoch 91/200, Loss: 0.09151157384277672
0.6621320128302919
Epoch 101/200, Loss: 0.09069831709387483
0.6633989166699388
Epoch 111/200, Loss: 0.09064471833808448
0.6622285517941845
Epoch 121/200, Loss: 0.09025395613524222
0.6609624745665719
Epoch 131/200, Loss: 0.09133016270014548
0.663833978384517
Epoch 141/200, Loss: 0.09083320312602546
0.6617489434014878
Epoch 151/200, Loss: 0.090305414571557
0.6629827226231167
Epoch 161/200, Loss: 0.09000839144792608
0.6623704580527

[I 2024-01-21 01:28:40,310] Trial 65 finished with value: 0.663833978384517 and parameters: {'hidden_dim_h': 12, 'dropout': 0.06343548213948322, 'batch_size': 217}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.9419005342892238
0.558456695456275
Epoch 11/200, Loss: 0.5319127511410486
0.6226422292826691
Epoch 21/200, Loss: 0.3435204852195013
0.6355142652865955
Epoch 31/200, Loss: 0.27016121858642217
0.6387207007606197
Epoch 41/200, Loss: 0.24263949550333477
0.647535114059876
Epoch 51/200, Loss: 0.22782989839712778
0.645326901427082
Epoch 61/200, Loss: 0.2164038916428884
0.6462178174266378
Epoch 71/200, Loss: 0.20402054559616817
0.6478553117148922
Epoch 81/200, Loss: 0.19155135466938927
0.6523311477196015
Epoch 91/200, Loss: 0.17977919110230037
0.6496171073159008
Epoch 101/200, Loss: 0.16822008149964468
0.6507844279292344
Epoch 111/200, Loss: 0.15687499230816251
0.6549738976579461
Epoch 121/200, Loss: 0.1472986134744826
0.652132062605774
Epoch 131/200, Loss: 0.13580953897464842
0.654444918323083
Epoch 141/200, Loss: 0.12817803202640443
0.656857195683367
Epoch 151/200, Loss: 0.12028084979170844
0.6551811715832104
Epoch 161/200, Loss: 0.11348220989817664
0.6567022127473299
Ep

[I 2024-01-21 01:29:21,876] Trial 66 finished with value: 0.6586310710628405 and parameters: {'hidden_dim_h': 15, 'dropout': 0.08405585296309387, 'batch_size': 987}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.35362385639122557
0.6023521815414907
Epoch 11/200, Loss: 0.20860297019992555
0.6356131804456804
Epoch 21/200, Loss: 0.14150289839931895
0.6498173893400633
Epoch 31/200, Loss: 0.10881889398608889
0.6528215423287907
Epoch 41/200, Loss: 0.09717768175261361
0.6487611818788933
Epoch 51/200, Loss: 0.09324994438460894
0.6582878343169223
Epoch 61/200, Loss: 0.09225432713116918
0.6586569345820563
Epoch 71/200, Loss: 0.09190003648400306
0.659814461007171
Epoch 81/200, Loss: 0.09147859673414911
0.6563536695138065
Epoch 91/200, Loss: 0.0917472643511636
0.6590377202454268
Epoch 101/200, Loss: 0.09141650082809584
0.6599110514796612
Epoch 111/200, Loss: 0.09193240212542671
0.6590881080776193
Epoch 121/200, Loss: 0.09151502943464689
0.6591858609329438
Epoch 131/200, Loss: 0.09103105078850474
0.6566955549084029
Epoch 141/200, Loss: 0.09208147451281548
0.6604185588058873
Epoch 151/200, Loss: 0.09069776449884687
0.6593032966741974
Epoch 161/200, Loss: 0.09098732801420348
0.6572045665

[I 2024-01-21 01:30:20,964] Trial 67 finished with value: 0.6638729963625445 and parameters: {'hidden_dim_h': 30, 'dropout': 0.15606101907603753, 'batch_size': 286}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.5844234686344862
0.5877196794104136
Epoch 11/200, Loss: 0.2059111397713423
0.6334958773935601
Epoch 21/200, Loss: 0.1635671505704522
0.6468972163549037
Epoch 31/200, Loss: 0.12835137452930212
0.642656935464459
Epoch 41/200, Loss: 0.10793248619884252
0.6454293363263379
Epoch 51/200, Loss: 0.09865169478580356
0.6529041080080091
Epoch 61/200, Loss: 0.09603282734751702
0.6528599631581512
Epoch 71/200, Loss: 0.09554681116715073
0.6504999258833288
Epoch 81/200, Loss: 0.09430637089535594
0.6535215336224574
Epoch 91/200, Loss: 0.0947044052183628
0.6553189078106642
Epoch 101/200, Loss: 0.0947845233604312
0.654502686982646
Epoch 111/200, Loss: 0.09469304215162992
0.6535845987437622
Epoch 121/200, Loss: 0.09412161437794567
0.6582246178572785
Epoch 131/200, Loss: 0.09397572865709662
0.6552907902891436
Epoch 141/200, Loss: 0.09383687553927303
0.6548448375205672
Epoch 151/200, Loss: 0.09356250734999776
0.6566831622190051
Epoch 161/200, Loss: 0.0936956387013197
0.6593477171645438

[I 2024-01-21 01:31:31,359] Trial 68 finished with value: 0.6611550194832663 and parameters: {'hidden_dim_h': 49, 'dropout': 0.32931450430504355, 'batch_size': 250}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.49127331574757893
0.5802698104812241
Epoch 11/200, Loss: 0.12786232978105544
0.6526746888371995
Epoch 21/200, Loss: 0.10685640275478363
0.6540134888776116
Epoch 31/200, Loss: 0.10273905048767726
0.6574784666099732
Epoch 41/200, Loss: 0.09896358052889506
0.6537525839773336
Epoch 51/200, Loss: 0.09593013806475534
0.6562180890748331
Epoch 61/200, Loss: 0.09391145573721991
0.6613628635978572
Epoch 71/200, Loss: 0.09242561923133003
0.6540412745668762
Epoch 81/200, Loss: 0.09104064553976059
0.6589762034481705
Epoch 91/200, Loss: 0.09040375898281733
0.6630498805381358
Epoch 101/200, Loss: 0.09054477545950147
0.6591963666787305
Epoch 111/200, Loss: 0.09031027307113011
0.662076152498309
Epoch 121/200, Loss: 0.08997362421618568
0.6618275270381244
Epoch 131/200, Loss: 0.0895843740966585
0.661789063701777
Epoch 141/200, Loss: 0.08956313348478741
0.6607872000869465
Epoch 151/200, Loss: 0.09013984468248155
0.6611324406409751
Epoch 161/200, Loss: 0.08935780425866445
0.65962985226

[I 2024-01-21 01:32:18,434] Trial 69 finished with value: 0.6630498805381358 and parameters: {'hidden_dim_h': 12, 'dropout': 0.060215868962143426, 'batch_size': 447}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 1.1315127048227522
0.5739707186099109
Epoch 11/200, Loss: 0.3997315673364533
0.6292478875506434
Epoch 21/200, Loss: 0.16951446359356245
0.6395670966539239
Epoch 31/200, Loss: 0.12019627913832664
0.6496524699103666
Epoch 41/200, Loss: 0.11192849609586927
0.6551390917301751
Epoch 51/200, Loss: 0.10900276650985082
0.6518763458757423
Epoch 61/200, Loss: 0.10624435688886377
0.655015795412983
Epoch 71/200, Loss: 0.10372978717916542
0.6615499410791491
Epoch 81/200, Loss: 0.1011420138594177
0.6570741616237036
Epoch 91/200, Loss: 0.09803764253026909
0.6585487519730265
Epoch 101/200, Loss: 0.09573363699018955
0.6588649110820206
Epoch 111/200, Loss: 0.09382454802592595
0.6598150530375824
Epoch 121/200, Loss: 0.0924847283297115
0.6595433280070105
Epoch 131/200, Loss: 0.0915213158975045
0.65709882043964
Epoch 141/200, Loss: 0.09072152587274711
0.6591713491658083
Epoch 151/200, Loss: 0.09008350347479184
0.6628963685465198
Epoch 161/200, Loss: 0.08975537845657931
0.6549527185479193

[I 2024-01-21 01:33:05,690] Trial 70 finished with value: 0.6628963685465198 and parameters: {'hidden_dim_h': 27, 'dropout': 0.07390686188472614, 'batch_size': 564}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.5587950468063354
0.5957422137077324
Epoch 11/200, Loss: 0.13699163954172816
0.6465194747422983
Epoch 21/200, Loss: 0.12309068675552096
0.6476822588795295
Epoch 31/200, Loss: 0.11114132862005915
0.6516281712898853
Epoch 41/200, Loss: 0.10225896164774895
0.6500825895204341
Epoch 51/200, Loss: 0.09614816318665231
0.6524546539685144
Epoch 61/200, Loss: 0.0932050734758377
0.6556167774912584
Epoch 71/200, Loss: 0.09247377110379083
0.6584213482491467
Epoch 81/200, Loss: 0.09151000029274396
0.655933054790537
Epoch 91/200, Loss: 0.09228933049099786
0.6603521358529825
Epoch 101/200, Loss: 0.09196176518286978
0.6573805281262671
Epoch 111/200, Loss: 0.09160649489079203
0.6627745033171779
Epoch 121/200, Loss: 0.09149942110691751
0.6618678162267907
Epoch 131/200, Loss: 0.0916524734880243
0.6619945259068812
Epoch 141/200, Loss: 0.09139247770820345
0.6573918904637724
Epoch 151/200, Loss: 0.0910193579537528
0.6586120508045926
Epoch 161/200, Loss: 0.09144818612507412
0.6567618359902

[I 2024-01-21 01:34:04,720] Trial 71 finished with value: 0.6627745033171779 and parameters: {'hidden_dim_h': 30, 'dropout': 0.15130508128519482, 'batch_size': 287}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.1824669358630975
0.5975069680521529
Epoch 11/200, Loss: 0.12417304875950018
0.6483223089580605
Epoch 21/200, Loss: 0.10197299520174662
0.6556837781465
Epoch 31/200, Loss: 0.09406669549643994
0.654523003875693
Epoch 41/200, Loss: 0.09159183725714684
0.6635016944681994
Epoch 51/200, Loss: 0.09092137801150481
0.6606322511631934
Epoch 61/200, Loss: 0.09048902690410614
0.6618975139545145
Epoch 71/200, Loss: 0.08977736427138248
0.6559139318954034
Epoch 81/200, Loss: 0.09046306734283766
0.6554888693930533
Epoch 91/200, Loss: 0.08993012917538484
0.6602148902801619
Epoch 101/200, Loss: 0.09039838512738546
0.660299675501479
Epoch 111/200, Loss: 0.09095392649372419
0.6624937337128484
Epoch 121/200, Loss: 0.08981654892365137
0.6639634827545203
Epoch 131/200, Loss: 0.08979281609257063
0.6588991150671097
Epoch 141/200, Loss: 0.08967916977902253
0.6631763172904186
Epoch 151/200, Loss: 0.08979120440781116
0.6557121607097214
Epoch 161/200, Loss: 0.09002497630814711
0.66051588586383

[I 2024-01-21 01:34:58,486] Trial 72 finished with value: 0.6639634827545203 and parameters: {'hidden_dim_h': 18, 'dropout': 0.05019785264817972, 'batch_size': 338}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 1.0735136641830694
0.5769097108107715
Epoch 11/200, Loss: 0.1874587745940099
0.6364244638903133
Epoch 21/200, Loss: 0.10153511557422701
0.648623350758844
Epoch 31/200, Loss: 0.0971157085455832
0.6547575053807992
Epoch 41/200, Loss: 0.09454330124083113
0.6522666752749484
Epoch 51/200, Loss: 0.09446470121868321
0.6522122697458664
Epoch 61/200, Loss: 0.09293097660678332
0.6591554487557465
Epoch 71/200, Loss: 0.0920534710415074
0.6607185093153644
Epoch 81/200, Loss: 0.0906941402764594
0.6605140489959186
Epoch 91/200, Loss: 0.09069420873630242
0.6615784389926893
Epoch 101/200, Loss: 0.09083238964686628
0.6597920045733565
Epoch 111/200, Loss: 0.08992825619509963
0.6612373262694272
Epoch 121/200, Loss: 0.09027603757186015
0.659088578188084
Epoch 131/200, Loss: 0.09026441307830028
0.6589715101355106
Epoch 141/200, Loss: 0.08975790575390956
0.6602214040030564
Epoch 151/200, Loss: 0.09124685848345522
0.6607742484158943
Epoch 161/200, Loss: 0.0905947636385433
0.6626964118330062

[I 2024-01-21 01:35:52,752] Trial 73 finished with value: 0.6631429392067743 and parameters: {'hidden_dim_h': 18, 'dropout': 0.05278177340747934, 'batch_size': 333}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.36394391896633
0.5947448163551724
Epoch 11/200, Loss: 0.2040573272567529
0.6467689241149511
Epoch 21/200, Loss: 0.1716961760360461
0.6479723793577017
Epoch 31/200, Loss: 0.14179168469630754
0.653190935893377
Epoch 41/200, Loss: 0.11971708702353331
0.6497774923360866
Epoch 51/200, Loss: 0.10468549481951274
0.6465718952944892
Epoch 61/200, Loss: 0.09698991964642818
0.6558922448383319
Epoch 71/200, Loss: 0.09341940111838855
0.6572399245253917
Epoch 81/200, Loss: 0.09049760048779157
0.6603269173340259
Epoch 91/200, Loss: 0.09032869353317298
0.6578854184384627
Epoch 101/200, Loss: 0.089854353465713
0.6603921609159995
Epoch 111/200, Loss: 0.09059486265939015
0.6597576640981954
Epoch 121/200, Loss: 0.08966805871862632
0.6637260112844451
Epoch 131/200, Loss: 0.09028208470688416
0.6582506954908348
Epoch 141/200, Loss: 0.08939073507029277
0.6594335283278483
Epoch 151/200, Loss: 0.09008237848488185
0.6610831469369419
Epoch 161/200, Loss: 0.09037917393904465
0.6638288931795367

[I 2024-01-21 01:36:42,882] Trial 74 finished with value: 0.6638288931795367 and parameters: {'hidden_dim_h': 21, 'dropout': 0.07446171377358309, 'batch_size': 391}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 1.0610425331619349
0.5850370842543751
Epoch 11/200, Loss: 0.26476919132002286
0.5521715783632664
Epoch 21/200, Loss: 0.19058857054522868
0.6268145071516804
Epoch 31/200, Loss: 0.14992735091220127
0.6463711301460245
Epoch 41/200, Loss: 0.11814985491251678
0.6529134350390994
Epoch 51/200, Loss: 0.100702227501387
0.6529436494802733
Epoch 61/200, Loss: 0.0938790086447523
0.6553439114787113
Epoch 71/200, Loss: 0.09179994204405988
0.6576243206928429
Epoch 81/200, Loss: 0.09143611219491851
0.6588738188705451
Epoch 91/200, Loss: 0.09163401560502106
0.6582098517393665
Epoch 101/200, Loss: 0.09061936012814555
0.661103091170859
Epoch 111/200, Loss: 0.09077296422773533
0.659528616867143
Epoch 121/200, Loss: 0.09077380991049028
0.6601790497817748
Epoch 131/200, Loss: 0.09106287619705951
0.663669714001661
Epoch 141/200, Loss: 0.09051406835572104
0.6591376957036131
Epoch 151/200, Loss: 0.0906026153249687
0.6587443183859859
Epoch 161/200, Loss: 0.090376346549961
0.6624056444765022
E

[I 2024-01-21 01:37:44,967] Trial 75 finished with value: 0.663669714001661 and parameters: {'hidden_dim_h': 17, 'dropout': 0.050231414385480525, 'batch_size': 225}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.1914318247442752
0.6093849372793689
Epoch 11/200, Loss: 0.10995862395626253
0.6449600958073257
Epoch 21/200, Loss: 0.09658366956014548
0.6537027302394344
Epoch 31/200, Loss: 0.09352740810244484
0.6469163234008675
Epoch 41/200, Loss: 0.09327906976758907
0.660623030670016
Epoch 51/200, Loss: 0.09319192856813954
0.652809677965157
Epoch 61/200, Loss: 0.09276856069939327
0.6575224695601138
Epoch 71/200, Loss: 0.09238608267191237
0.657082753125476
Epoch 81/200, Loss: 0.09212246154789376
0.6594727721089881
Epoch 91/200, Loss: 0.09186113480709296
0.6585274712532191
Epoch 101/200, Loss: 0.09148990085958379
0.662068612806481
Epoch 111/200, Loss: 0.09125186252383004
0.6564370478939139
Epoch 121/200, Loss: 0.09165293268397846
0.6597433827514769
Epoch 131/200, Loss: 0.09151945790622086
0.6593205514770643
Epoch 141/200, Loss: 0.09143863400790543
0.6559377738601251
Epoch 151/200, Loss: 0.09146702137932314
0.6566487161050738
Epoch 161/200, Loss: 0.09167893382564055
0.6613549192861

[I 2024-01-21 01:39:03,826] Trial 76 finished with value: 0.662068612806481 and parameters: {'hidden_dim_h': 49, 'dropout': 0.06754028108531485, 'batch_size': 177}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.5124441231450727
0.5840590392755846
Epoch 11/200, Loss: 0.18275715506845905
0.6404747508254085
Epoch 21/200, Loss: 0.12792347587885394
0.6469371019101501
Epoch 31/200, Loss: 0.12051017342075225
0.6536922700462217
Epoch 41/200, Loss: 0.1153586009337056
0.6562216613883064
Epoch 51/200, Loss: 0.11131071755962987
0.6546493360652716
Epoch 61/200, Loss: 0.10638854099858192
0.6573431482039201
Epoch 71/200, Loss: 0.10250665151303814
0.6564906349573193
Epoch 81/200, Loss: 0.09928280980356279
0.6596575816694529
Epoch 91/200, Loss: 0.09625065879475686
0.658645210129083
Epoch 101/200, Loss: 0.0934685168247069
0.6582302497367422
Epoch 111/200, Loss: 0.0926688291853474
0.658276406818411
Epoch 121/200, Loss: 0.09091241297221953
0.6599064982786386
Epoch 131/200, Loss: 0.09042978791459914
0.660253060813934
Epoch 141/200, Loss: 0.09006497960898184
0.6643064264846936
Epoch 151/200, Loss: 0.09033723487969368
0.6599378585699555
Epoch 161/200, Loss: 0.08926862670529273
0.662318210117477

[I 2024-01-21 01:39:47,062] Trial 77 finished with value: 0.6643064264846936 and parameters: {'hidden_dim_h': 20, 'dropout': 0.09251449333356777, 'batch_size': 656}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.7449345333235604
0.567940831812402
Epoch 11/200, Loss: 0.35840465873479843
0.6221173849263423
Epoch 21/200, Loss: 0.25117742855634007
0.6367968908079136
Epoch 31/200, Loss: 0.22293642269713537
0.6401891300876212
Epoch 41/200, Loss: 0.20548608100840024
0.6430202153389868
Epoch 51/200, Loss: 0.189235407859087
0.6467274780141489
Epoch 61/200, Loss: 0.17297067173889705
0.6423729598663744
Epoch 71/200, Loss: 0.1571078518671649
0.6451652698609669
Epoch 81/200, Loss: 0.14265355308141028
0.650423344466876
Epoch 91/200, Loss: 0.13063063179808004
0.6527436441487708
Epoch 101/200, Loss: 0.11999159253069333
0.6561696738012047
Epoch 111/200, Loss: 0.11093480273016862
0.6524037764187988
Epoch 121/200, Loss: 0.10451054040874753
0.6603933405120912
Epoch 131/200, Loss: 0.09924139348523957
0.6579193475131772
Epoch 141/200, Loss: 0.09550972761852401
0.6578447647282221
Epoch 151/200, Loss: 0.09297399621989046
0.6588465504201545
Epoch 161/200, Loss: 0.09162157561097826
0.65928972916672

[I 2024-01-21 01:40:29,911] Trial 78 finished with value: 0.6626004008293709 and parameters: {'hidden_dim_h': 14, 'dropout': 0.09355113529041768, 'batch_size': 729}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.4776155064503352
0.5741527239327786
Epoch 11/200, Loss: 0.26415807058413826
0.6548793253107321
Epoch 21/200, Loss: 0.22739666452010474
0.6517386939196073
Epoch 31/200, Loss: 0.20149551679690678
0.6527519682605146
Epoch 41/200, Loss: 0.17620320965846378
0.6552611096182503
Epoch 51/200, Loss: 0.15409680257240932
0.6520473751900231
Epoch 61/200, Loss: 0.13590838784972828
0.6573396221042291
Epoch 71/200, Loss: 0.12105781709154446
0.6540799126644538
Epoch 81/200, Loss: 0.10984669476747513
0.6576162162300185
Epoch 91/200, Loss: 0.10207993959387143
0.6583250662717787
Epoch 101/200, Loss: 0.097072634100914
0.6570504799700292
Epoch 111/200, Loss: 0.09414357195297877
0.6593698002827488
Epoch 121/200, Loss: 0.09163009350498517
0.6582361845739063
Epoch 131/200, Loss: 0.09031725352009137
0.6610036334872929
Epoch 141/200, Loss: 0.09016767889261246
0.6584058018472959
Epoch 151/200, Loss: 0.09045543149113655
0.6583620422509591
Epoch 161/200, Loss: 0.08993792658050855
0.66043661674

[I 2024-01-21 01:41:12,467] Trial 79 finished with value: 0.6619274152143265 and parameters: {'hidden_dim_h': 18, 'dropout': 0.0824678521465067, 'batch_size': 680}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.6189679944956744
0.5787862361045243
Epoch 11/200, Loss: 0.2864532040225135
0.6396511924960984
Epoch 21/200, Loss: 0.19865788298624534
0.64389731410306
Epoch 31/200, Loss: 0.1797685694915277
0.6488841401967086
Epoch 41/200, Loss: 0.16986862983968523
0.6545138535889288
Epoch 51/200, Loss: 0.1597901764843199
0.6511392128658974
Epoch 61/200, Loss: 0.14993267368387292
0.6550879665123779
Epoch 71/200, Loss: 0.13980722261799705
0.6541782430048639
Epoch 81/200, Loss: 0.13048569609721503
0.653310061338924
Epoch 91/200, Loss: 0.12204586410963977
0.655574036746509
Epoch 101/200, Loss: 0.11484600962312133
0.6564323830673446
Epoch 111/200, Loss: 0.10811401324139701
0.6515858123233637
Epoch 121/200, Loss: 0.10271311468548244
0.659756869263776
Epoch 131/200, Loss: 0.09922979965254113
0.6582218467996694
Epoch 141/200, Loss: 0.0959726635504652
0.6602498699625065
Epoch 151/200, Loss: 0.09342916696159928
0.6556121020206122
Epoch 161/200, Loss: 0.09215425644759778
0.6562184685010957
E

[I 2024-01-21 01:41:56,598] Trial 80 finished with value: 0.6607058043842526 and parameters: {'hidden_dim_h': 24, 'dropout': 0.10949644160390298, 'batch_size': 743}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.23389283418655396
0.5833207776680657
Epoch 11/200, Loss: 0.1694165642062823
0.6471240910403494
Epoch 21/200, Loss: 0.14848438749710718
0.6533310717041714
Epoch 31/200, Loss: 0.13081154252092045
0.6540723371662721
Epoch 41/200, Loss: 0.11710994144280752
0.6540682575575303
Epoch 51/200, Loss: 0.10654663542906444
0.6559993186941565
Epoch 61/200, Loss: 0.09985380346576372
0.6576497163472507
Epoch 71/200, Loss: 0.09487837205330531
0.66086249598955
Epoch 81/200, Loss: 0.09270883426070213
0.6572296131278762
Epoch 91/200, Loss: 0.09094257603089015
0.6613877388547664
Epoch 101/200, Loss: 0.09014370416601498
0.6595936203460014
Epoch 111/200, Loss: 0.08977930297454198
0.6584304109360837
Epoch 121/200, Loss: 0.08937120561798413
0.6601433792971648
Epoch 131/200, Loss: 0.08971691975990931
0.6617035272230168
Epoch 141/200, Loss: 0.08943112293879191
0.6632021413555655
Epoch 151/200, Loss: 0.0895451158285141
0.6597620150196016
Epoch 161/200, Loss: 0.0896641418337822
0.6581294905435

[I 2024-01-21 01:42:39,273] Trial 81 finished with value: 0.6634991960671341 and parameters: {'hidden_dim_h': 20, 'dropout': 0.05863346803652595, 'batch_size': 675}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 1.359818086904638
0.5726645987369063
Epoch 11/200, Loss: 0.6008475300143746
0.6222261702172657
Epoch 21/200, Loss: 0.3256475189152886
0.6385780420909944
Epoch 31/200, Loss: 0.24724813506883733
0.6466009783500689
Epoch 41/200, Loss: 0.22401126868584575
0.6453245556474471
Epoch 51/200, Loss: 0.2082397205864682
0.6513156300971088
Epoch 61/200, Loss: 0.19229901713483474
0.6512620890788559
Epoch 71/200, Loss: 0.17604839933269165
0.6459344682963846
Epoch 81/200, Loss: 0.16061106192715027
0.6476137216555846
Epoch 91/200, Loss: 0.14509247243404388
0.6553655500323806
Epoch 101/200, Loss: 0.1320560758604723
0.6507472383741019
Epoch 111/200, Loss: 0.11987264366710887
0.6522954330217883
Epoch 121/200, Loss: 0.11103534632745911
0.6582327184543104
Epoch 131/200, Loss: 0.10392331134747057
0.6487121640938606
Epoch 141/200, Loss: 0.09787882689167471
0.6580920366748618
Epoch 151/200, Loss: 0.09413872067542638
0.6571601703319158
Epoch 161/200, Loss: 0.09267440394443624
0.65704336711868

[I 2024-01-21 01:43:23,220] Trial 82 finished with value: 0.6630032819584926 and parameters: {'hidden_dim_h': 17, 'dropout': 0.09018465872566377, 'batch_size': 600}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.22125918890644863
0.5904008873048169
Epoch 11/200, Loss: 0.11493357666200255
0.6482225579112789
Epoch 21/200, Loss: 0.09716423505508318
0.6429871030370431
Epoch 31/200, Loss: 0.09563913448463852
0.661842195998176
Epoch 41/200, Loss: 0.09516289925611601
0.6546384784056746
Epoch 51/200, Loss: 0.09478364453264852
0.6569782078344043
Epoch 61/200, Loss: 0.09456663692324627
0.6547021604839425
Epoch 71/200, Loss: 0.093856428954296
0.6606910065337177
Epoch 81/200, Loss: 0.0941843598535875
0.661435030885598
Epoch 91/200, Loss: 0.09400739393583159
0.6570740255580212
Epoch 101/200, Loss: 0.09350068671855985
0.6583761636206072
Epoch 111/200, Loss: 0.09343438577361224
0.6579959700887381
Epoch 121/200, Loss: 0.09370633419148805
0.6600748212236174
Epoch 131/200, Loss: 0.09339831583201885
0.658750122607919
Epoch 141/200, Loss: 0.09301727196973998
0.6614092886305049
Epoch 151/200, Loss: 0.09313306594040335
0.659461876415628
Epoch 161/200, Loss: 0.09308766605468785
0.656896444072815

[I 2024-01-21 01:44:58,468] Trial 83 finished with value: 0.661842195998176 and parameters: {'hidden_dim_h': 15, 'dropout': 0.21524361210962883, 'batch_size': 122}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.5514990378029739
0.5999654259954836
Epoch 11/200, Loss: 0.2108405800182608
0.6437720738228162
Epoch 21/200, Loss: 0.1633156666272803
0.6426379164681837
Epoch 31/200, Loss: 0.12597511520114127
0.6465706066785241
Epoch 41/200, Loss: 0.10503444198188902
0.6515998338202789
Epoch 51/200, Loss: 0.096014009057721
0.6508663116500174
Epoch 61/200, Loss: 0.0932941809296608
0.6583914245263659
Epoch 71/200, Loss: 0.09312427345710465
0.6574553119698422
Epoch 81/200, Loss: 0.092087956451917
0.6594273271932413
Epoch 91/200, Loss: 0.0918948707889907
0.6613609967078267
Epoch 101/200, Loss: 0.0916289708848241
0.6558042581304457
Epoch 111/200, Loss: 0.09138955996383595
0.6584618223838021
Epoch 121/200, Loss: 0.0916262285996087
0.66162575948067
Epoch 131/200, Loss: 0.09165791742786576
0.6554189875191193
Epoch 141/200, Loss: 0.09170831598435776
0.6586477298464694
Epoch 151/200, Loss: 0.0915535909088352
0.6579996171129618
Epoch 161/200, Loss: 0.0911770847779286
0.6613969496777108
Epoch 

[I 2024-01-21 01:46:06,749] Trial 84 finished with value: 0.6631303946022532 and parameters: {'hidden_dim_h': 47, 'dropout': 0.11828572936251142, 'batch_size': 255}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 1.0810937285423279
0.5685320192180516
Epoch 11/200, Loss: 0.5517638188142043
0.6238608603756347
Epoch 21/200, Loss: 0.32977452186437756
0.6378274415710533
Epoch 31/200, Loss: 0.25290005711408764
0.6383781962607
Epoch 41/200, Loss: 0.227241833622639
0.6436687689580366
Epoch 51/200, Loss: 0.21328556881501123
0.6439243034119221
Epoch 61/200, Loss: 0.2001802004300631
0.6449554985093224
Epoch 71/200, Loss: 0.1870653090568689
0.6506412441502094
Epoch 81/200, Loss: 0.17404201798714125
0.6542421208815041
Epoch 91/200, Loss: 0.16133390710904047
0.6492582462965062
Epoch 101/200, Loss: 0.1488330983198606
0.6498719083324141
Epoch 111/200, Loss: 0.13780022641787162
0.6507385235512902
Epoch 121/200, Loss: 0.12784148781345442
0.6533105906361978
Epoch 131/200, Loss: 0.11865433878623523
0.6552661178009552
Epoch 141/200, Loss: 0.11162791257867447
0.6541213203416453
Epoch 151/200, Loss: 0.10551541871749438
0.6553192236719252
Epoch 161/200, Loss: 0.10103667240876418
0.6575766138404658
E

[I 2024-01-21 01:46:59,237] Trial 85 finished with value: 0.6575766138404658 and parameters: {'hidden_dim_h': 43, 'dropout': 0.0697917854016413, 'batch_size': 780}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.9045303937716361
0.5788779396114327
Epoch 11/200, Loss: 0.3066914417804816
0.6368522285596144
Epoch 21/200, Loss: 0.1753227649590908
0.6413493536143684
Epoch 31/200, Loss: 0.15595531578247362
0.6460019212308378
Epoch 41/200, Loss: 0.14638535028848892
0.647362722707278
Epoch 51/200, Loss: 0.13757183536505088
0.6571216772742954
Epoch 61/200, Loss: 0.12953407412920243
0.6456358799082998
Epoch 71/200, Loss: 0.11879982302586238
0.6550043079881163
Epoch 81/200, Loss: 0.11247785752400374
0.6513856099683708
Epoch 91/200, Loss: 0.1044919830866349
0.6522900142416654
Epoch 101/200, Loss: 0.1000265889824965
0.6522075818750015
Epoch 111/200, Loss: 0.09560140031270492
0.6558935520790801
Epoch 121/200, Loss: 0.09406547649548604
0.6558564070806071
Epoch 131/200, Loss: 0.09331722691273078
0.6578349343163855
Epoch 141/200, Loss: 0.09210912310160123
0.6586624714749664
Epoch 151/200, Loss: 0.09142984583591804
0.6523958150743983
Epoch 161/200, Loss: 0.09069371968507767
0.66043267878348

[I 2024-01-21 01:47:54,204] Trial 86 finished with value: 0.6620159719780269 and parameters: {'hidden_dim_h': 45, 'dropout': 0.13438881080746362, 'batch_size': 525}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.36343575853567855
0.5814933390132416
Epoch 11/200, Loss: 0.20927811792263618
0.6497445842215211
Epoch 21/200, Loss: 0.14884959138356724
0.6446069498358031
Epoch 31/200, Loss: 0.11445102909436593
0.657169181743864
Epoch 41/200, Loss: 0.09831358022414721
0.6564341416269915
Epoch 51/200, Loss: 0.09343369350983546
0.6561080898313628
Epoch 61/200, Loss: 0.09140934737829062
0.6566984589232925
Epoch 71/200, Loss: 0.09114998636337426
0.6596682797155998
Epoch 81/200, Loss: 0.09081367758604196
0.6607783773599601
Epoch 91/200, Loss: 0.09023820494229977
0.6604787088541845
Epoch 101/200, Loss: 0.09064839608394183
0.6611296774942513
Epoch 111/200, Loss: 0.09035357202474888
0.6598499572183824
Epoch 121/200, Loss: 0.09003865936627754
0.6600230472281728
Epoch 131/200, Loss: 0.0905206872866704
0.6579397999311253
Epoch 141/200, Loss: 0.08994946674658702
0.6606983934594932
Epoch 151/200, Loss: 0.08987636829798039
0.6621703036930011
Epoch 161/200, Loss: 0.08973739124261416
0.6600394275

[I 2024-01-21 01:48:50,186] Trial 87 finished with value: 0.6634758818702162 and parameters: {'hidden_dim_h': 20, 'dropout': 0.08160203394100811, 'batch_size': 309}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.40044074558785986
0.5999989935897525
Epoch 11/200, Loss: 0.17257011947887285
0.6395243311274142
Epoch 21/200, Loss: 0.14608393529696123
0.6392781587512029
Epoch 31/200, Loss: 0.12249849177896976
0.6479577110926736
Epoch 41/200, Loss: 0.10673876000302178
0.6478605097442713
Epoch 51/200, Loss: 0.09812296048871108
0.6553294054415328
Epoch 61/200, Loss: 0.09409291403634208
0.6565122328252682
Epoch 71/200, Loss: 0.09310432297310658
0.6574823548102273
Epoch 81/200, Loss: 0.09191912811781679
0.6579369742511181
Epoch 91/200, Loss: 0.0920942138348307
0.6586328422997357
Epoch 101/200, Loss: 0.09102604697857584
0.65967705713122
Epoch 111/200, Loss: 0.0910307816894991
0.660455622267194
Epoch 121/200, Loss: 0.09121492984039443
0.6605809756497444
Epoch 131/200, Loss: 0.09068939182907343
0.6627702437318087
Epoch 141/200, Loss: 0.09098801482468843
0.6576902178350092
Epoch 151/200, Loss: 0.09009491785296372
0.6594503206448787
Epoch 161/200, Loss: 0.09101648708539349
0.6599610723032

[I 2024-01-21 01:49:51,965] Trial 88 finished with value: 0.6627702437318087 and parameters: {'hidden_dim_h': 50, 'dropout': 0.10140537502445937, 'batch_size': 362}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.3636390440391772
0.5996613223204748
Epoch 11/200, Loss: 0.18339668620716443
0.6128221599335867
Epoch 21/200, Loss: 0.1194402686122692
0.6492535245170489
Epoch 31/200, Loss: 0.10102840091543969
0.6551886896005367
Epoch 41/200, Loss: 0.09341554885560815
0.6600600018092798
Epoch 51/200, Loss: 0.09173812589260062
0.6522831068014971
Epoch 61/200, Loss: 0.09199511263557154
0.656445433984558
Epoch 71/200, Loss: 0.09253271766985306
0.6575358396168766
Epoch 81/200, Loss: 0.09255369654809585
0.6577116364495865
Epoch 91/200, Loss: 0.092708725595113
0.6581865274862093
Epoch 101/200, Loss: 0.09125990834501055
0.6581389610329629
Epoch 111/200, Loss: 0.09159908014716524
0.6585519500356773
Epoch 121/200, Loss: 0.09152986041524193
0.6570833556618445
Epoch 131/200, Loss: 0.0911143808954894
0.6565487110372504
Epoch 141/200, Loss: 0.09179969214730793
0.6645336529317225
Epoch 151/200, Loss: 0.09147956628691066
0.6610615773109872
Epoch 161/200, Loss: 0.09114857868413732
0.65955215069638

[I 2024-01-21 01:51:00,443] Trial 89 finished with value: 0.6645336529317225 and parameters: {'hidden_dim_h': 35, 'dropout': 0.060275976419738905, 'batch_size': 204}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.38260221605499584
0.597512608302375
Epoch 11/200, Loss: 0.11395140566552679
0.644540364783246
Epoch 21/200, Loss: 0.10240377384858827
0.6537411023849087
Epoch 31/200, Loss: 0.09568273966821532
0.6515907915591661
Epoch 41/200, Loss: 0.09273625968489796
0.655071506675596
Epoch 51/200, Loss: 0.09189310336175065
0.6575205383371551
Epoch 61/200, Loss: 0.09227565582841635
0.6532829642415262
Epoch 71/200, Loss: 0.09175213434112568
0.6591557650344423
Epoch 81/200, Loss: 0.09151349465052287
0.6517826504411429
Epoch 91/200, Loss: 0.0910537396169578
0.6584600926039814
Epoch 101/200, Loss: 0.09173610457219183
0.6608595614542538
Epoch 111/200, Loss: 0.0909019581352671
0.657854374509909
Epoch 121/200, Loss: 0.09130763627278309
0.656772333904508
Epoch 131/200, Loss: 0.09086917891787986
0.6630296804086808
Epoch 141/200, Loss: 0.09136925230268389
0.6628645104017179
Epoch 151/200, Loss: 0.09154810973753531
0.6562036369442811
Epoch 161/200, Loss: 0.09079140556665759
0.664683331769313

[I 2024-01-21 01:52:07,435] Trial 90 finished with value: 0.6646833317693135 and parameters: {'hidden_dim_h': 35, 'dropout': 0.06030961979516043, 'batch_size': 210}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 2.007251019429679
0.5582732968392025
Epoch 11/200, Loss: 0.33512618291107094
0.6299990864222992
Epoch 21/200, Loss: 0.22745602675760634
0.6519134212942319
Epoch 31/200, Loss: 0.18544915258282363
0.6402557457822863
Epoch 41/200, Loss: 0.14308542253995182
0.6403425924313525
Epoch 51/200, Loss: 0.11369286266842274
0.6480396108869536
Epoch 61/200, Loss: 0.09934188922246297
0.6472482068822693
Epoch 71/200, Loss: 0.09393193399665331
0.6523813036458772
Epoch 81/200, Loss: 0.09176269587543276
0.6575619837159099
Epoch 91/200, Loss: 0.09158461059283729
0.6566534417159419
Epoch 101/200, Loss: 0.09204500906094155
0.6598820537203608
Epoch 111/200, Loss: 0.09421832769206076
0.6568449722220232
Epoch 121/200, Loss: 0.09105997510028607
0.6550220133856559
Epoch 131/200, Loss: 0.09252385320988568
0.6579810810410058
Epoch 141/200, Loss: 0.09086050443125493
0.6635716452906926
Epoch 151/200, Loss: 0.09199839642252584
0.6586765485229796
Epoch 161/200, Loss: 0.09034694618347919
0.6609683228

[I 2024-01-21 01:53:16,006] Trial 91 finished with value: 0.6635716452906926 and parameters: {'hidden_dim_h': 37, 'dropout': 0.06073707472726709, 'batch_size': 204}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.6284126106832848
0.5962860684972296
Epoch 11/200, Loss: 0.21336329679508678
0.6314634290906456
Epoch 21/200, Loss: 0.1392527168891469
0.6413145191315899
Epoch 31/200, Loss: 0.10283750936877532
0.6467227818907425
Epoch 41/200, Loss: 0.0939841228918951
0.6527432745226391
Epoch 51/200, Loss: 0.09291059627640443
0.6517689475628258
Epoch 61/200, Loss: 0.09323271199083719
0.658827925529975
Epoch 71/200, Loss: 0.09241421862703855
0.6598681132157846
Epoch 81/200, Loss: 0.09149223917209712
0.6588593457980694
Epoch 91/200, Loss: 0.09126771558992199
0.6576593860224756
Epoch 101/200, Loss: 0.09156758478674733
0.6604373527469934
Epoch 111/200, Loss: 0.09171770244348244
0.6629598931197264
Epoch 121/200, Loss: 0.09127886791820408
0.6563045688008028
Epoch 131/200, Loss: 0.0911474834944381
0.652377362480216
Epoch 141/200, Loss: 0.09079566988788668
0.6617636590176672
Epoch 151/200, Loss: 0.09073309841581055
0.6608051828013708
Epoch 161/200, Loss: 0.09166847859494022
0.66244937106761

[I 2024-01-21 01:54:33,449] Trial 92 finished with value: 0.6629598931197264 and parameters: {'hidden_dim_h': 33, 'dropout': 0.07717946276585179, 'batch_size': 165}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 2.154298252894961
0.5626750287387161
Epoch 11/200, Loss: 0.1462379788530284
0.6275750583836779
Epoch 21/200, Loss: 0.11618190294709699
0.6466697120334909
Epoch 31/200, Loss: 0.10375836897512962
0.6553616103604563
Epoch 41/200, Loss: 0.09572634681545455
0.6528064197523061
Epoch 51/200, Loss: 0.09398047651710181
0.6538454199617325
Epoch 61/200, Loss: 0.09265099807546057
0.6558192085626507
Epoch 71/200, Loss: 0.093080893133221
0.6575159474203958
Epoch 81/200, Loss: 0.09237685614618762
0.6596615958030466
Epoch 91/200, Loss: 0.09258708404055957
0.6578521072266741
Epoch 101/200, Loss: 0.09207413247947036
0.6579862078764035
Epoch 111/200, Loss: 0.09205748752273363
0.6520506443887581
Epoch 121/200, Loss: 0.09173104249197861
0.6618980448028855
Epoch 131/200, Loss: 0.09159675800594791
0.6571336472183957
Epoch 141/200, Loss: 0.09161376326248563
0.6580795126388471
Epoch 151/200, Loss: 0.0914755755971218
0.6619798634037783
Epoch 161/200, Loss: 0.09231247824841532
0.66305490579138

[I 2024-01-21 01:56:01,091] Trial 93 finished with value: 0.6633769047890135 and parameters: {'hidden_dim_h': 40, 'dropout': 0.06673869174481639, 'batch_size': 138}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 1.0986729465335248
0.5888848297395938
Epoch 11/200, Loss: 0.18827389665396818
0.6289330102173111
Epoch 21/200, Loss: 0.15158959900040225
0.6378379615012327
Epoch 31/200, Loss: 0.13217373632163887
0.6463012836107817
Epoch 41/200, Loss: 0.11472995148365756
0.6480933496532574
Epoch 51/200, Loss: 0.10221145984279104
0.6501896909872397
Epoch 61/200, Loss: 0.09608776149261429
0.654450941385792
Epoch 71/200, Loss: 0.0938130804752729
0.658341906439003
Epoch 81/200, Loss: 0.09306431884866163
0.6603654835436016
Epoch 91/200, Loss: 0.0928449298602989
0.6566698539007435
Epoch 101/200, Loss: 0.09252228668655257
0.6594948132201581
Epoch 111/200, Loss: 0.09212369920618563
0.6538050501824452
Epoch 121/200, Loss: 0.09172197916062481
0.6583789678119896
Epoch 131/200, Loss: 0.09194527081696384
0.6605936137225003
Epoch 141/200, Loss: 0.09205478304121868
0.6581162334416617
Epoch 151/200, Loss: 0.09212066466549793
0.659428828509657
Epoch 161/200, Loss: 0.09206440111240709
0.6615525922352


[I 2024-01-21 01:57:06,569] Trial 94 finished with value: 0.6615525922352 and parameters: {'hidden_dim_h': 35, 'dropout': 0.05625781126540962, 'batch_size': 241}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.2861074793797273
0.5976041901396337
Epoch 11/200, Loss: 0.14258927164169458
0.627050612387617
Epoch 21/200, Loss: 0.10415602396600522
0.6472240564975517
Epoch 31/200, Loss: 0.0944610801883615
0.6558072115436316
Epoch 41/200, Loss: 0.09272589856901994
0.6567084463652458
Epoch 51/200, Loss: 0.09210357585778603
0.6512607510094579
Epoch 61/200, Loss: 0.09183110604779078
0.660732327956831
Epoch 71/200, Loss: 0.09217915146683271
0.6581286940486875
Epoch 81/200, Loss: 0.09144396650103423
0.659865580211881
Epoch 91/200, Loss: 0.09176480103857242
0.6610285383756458
Epoch 101/200, Loss: 0.09170660605797401
0.6597694484132803
Epoch 111/200, Loss: 0.09175507466380413
0.6602061803809838
Epoch 121/200, Loss: 0.09143498375152166
0.6600147483771067
Epoch 131/200, Loss: 0.09134710429666135
0.6596188169773617
Epoch 141/200, Loss: 0.09076990667157449
0.6583963845942666
Epoch 151/200, Loss: 0.09086082159326626
0.6625072438249728
Epoch 161/200, Loss: 0.09107499648458682
0.6580397176106

[I 2024-01-21 01:58:17,214] Trial 95 finished with value: 0.6625072438249728 and parameters: {'hidden_dim_h': 34, 'dropout': 0.07382139720396065, 'batch_size': 193}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.27125503962978403
0.5902894755354492
Epoch 11/200, Loss: 0.1492468016420273
0.6351144585015361
Epoch 21/200, Loss: 0.11274416863601258
0.6472830697855678
Epoch 31/200, Loss: 0.09768859986612137
0.6534082423655264
Epoch 41/200, Loss: 0.09374928038488044
0.6525470395987933
Epoch 51/200, Loss: 0.09287299461504246
0.6539015858187458
Epoch 61/200, Loss: 0.0921525186363687
0.6578368290875509
Epoch 71/200, Loss: 0.09244081766364422
0.6551015344234612
Epoch 81/200, Loss: 0.09167628584707037
0.660593613151572
Epoch 91/200, Loss: 0.09127855237494124
0.6562691932722104
Epoch 101/200, Loss: 0.09164231310182429
0.6531823243801131
Epoch 111/200, Loss: 0.09174460465920732
0.6592918434694099
Epoch 121/200, Loss: 0.09153373935755263
0.6551271228639379
Epoch 131/200, Loss: 0.09153285606744442
0.6551164204710098
Epoch 141/200, Loss: 0.09155455612121745
0.6580941671865298
Epoch 151/200, Loss: 0.09153180188955144
0.6586168803431779
Epoch 161/200, Loss: 0.09083485587480221
0.65756431550

[I 2024-01-21 01:59:27,384] Trial 96 finished with value: 0.6607764835883926 and parameters: {'hidden_dim_h': 48, 'dropout': 0.09247084478871753, 'batch_size': 213}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.38942487204545423
0.5951430725509415
Epoch 11/200, Loss: 0.15742408126396568
0.6380106115506133
Epoch 21/200, Loss: 0.10176118860315335
0.652055343356655
Epoch 31/200, Loss: 0.09387120888813545
0.6573952737465008
Epoch 41/200, Loss: 0.09294985695496986
0.6574733007602949
Epoch 51/200, Loss: 0.09238226015708949
0.6540226147033179
Epoch 61/200, Loss: 0.09242219522007201
0.656575047173198
Epoch 71/200, Loss: 0.09235518964889802
0.6579513809046672
Epoch 81/200, Loss: 0.09182586116520197
0.6580276569148131
Epoch 91/200, Loss: 0.09205697557741874
0.6620608595052654
Epoch 101/200, Loss: 0.09171035748563315
0.6616110118618408
Epoch 111/200, Loss: 0.09138008692350827
0.6559800879424474
Epoch 121/200, Loss: 0.09108615144597072
0.661374171726033
Epoch 131/200, Loss: 0.09126758690629351
0.6594840283662461
Epoch 141/200, Loss: 0.09123209604111157
0.6597832492730819
Epoch 151/200, Loss: 0.09116428543960578
0.6576538608143032
Epoch 161/200, Loss: 0.091422410142657
0.6605129702476

[I 2024-01-21 02:00:57,173] Trial 97 finished with value: 0.6620608595052654 and parameters: {'hidden_dim_h': 32, 'dropout': 0.05785998209060859, 'batch_size': 132}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 1.830071856578191
0.5592917053638918
Epoch 11/200, Loss: 1.0538634061813354
0.6089042614656754
Epoch 21/200, Loss: 0.5818028226494789
0.6151050374885434
Epoch 31/200, Loss: 0.3257960689564546
0.6286241391166666
Epoch 41/200, Loss: 0.19824273760120073
0.6413228067618507
Epoch 51/200, Loss: 0.14502042904496193
0.6446928553275644
Epoch 61/200, Loss: 0.12448183167725801
0.6478499569861749
Epoch 71/200, Loss: 0.11817128335436185
0.6544007609208837
Epoch 81/200, Loss: 0.11539523086200158
0.6559776526569688
Epoch 91/200, Loss: 0.11380870236704747
0.6503211746792597
Epoch 101/200, Loss: 0.11145906522870064
0.6541468697649387
Epoch 111/200, Loss: 0.10962036438286304
0.6546939343595215
Epoch 121/200, Loss: 0.10769991421451171
0.6568302946732829
Epoch 131/200, Loss: 0.10661161411553621
0.6587028091153116
Epoch 141/200, Loss: 0.10370716545730829
0.6551643271634248
Epoch 151/200, Loss: 0.10093490375826757
0.6531094515278538
Epoch 161/200, Loss: 0.0992381488904357
0.65839803399799

[I 2024-01-21 02:01:46,867] Trial 98 finished with value: 0.6598079989656077 and parameters: {'hidden_dim_h': 37, 'dropout': 0.05050732929156832, 'batch_size': 864}. Best is trial 63 with value: 0.6648751940069384.


Epoch 1/200, Loss: 0.5434712215264639
0.5853235988423128
Epoch 11/200, Loss: 0.19275273104508717
0.6426917394975634
Epoch 21/200, Loss: 0.15576207796732586
0.6472361160532307
Epoch 31/200, Loss: 0.12501579274733862
0.6526708806814743
Epoch 41/200, Loss: 0.10516170918941498
0.6504309376753201
Epoch 51/200, Loss: 0.09719556589921316
0.6504814462432614
Epoch 61/200, Loss: 0.09389367947975795
0.6491078532863973
Epoch 71/200, Loss: 0.09359014679988226
0.6572431522624242
Epoch 81/200, Loss: 0.09232621848583221
0.6535109013944189
Epoch 91/200, Loss: 0.0914962038397789
0.658468819708447
Epoch 101/200, Loss: 0.0921810598174731
0.6572389944928753
Epoch 111/200, Loss: 0.09195147335529327
0.6563838977848746
Epoch 121/200, Loss: 0.09120493372281392
0.6589442780849161
Epoch 131/200, Loss: 0.09282215336958567
0.6551530300643144
Epoch 141/200, Loss: 0.09106589814027151
0.6575678456785874
Epoch 151/200, Loss: 0.09112474878629048
0.6560405400214624
Epoch 161/200, Loss: 0.09092344423135122
0.660758927454

[I 2024-01-21 02:02:51,763] Trial 99 finished with value: 0.6613014779882631 and parameters: {'hidden_dim_h': 41, 'dropout': 0.085138958756978, 'batch_size': 270}. Best is trial 63 with value: 0.6648751940069384.


Best Trial:
  Value: 0.6649
  Params: 
    hidden_dim_h: 15
    dropout: 0.06118622949287433
    batch_size: 267
