START TIME: Fri Oct 27 12:38:45 CST 2023 e08r2n08 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================0 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================1 WORLD_SIZE*************96 LRANK===============================2 WORLD_SIZE*************96 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================2 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 LRANK===============================2 LRANK===============================2 LRANK===============================2 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 LRANK===============================3 LRANK===============================3 LRANK===============================3 LRANK===============================3 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 WORLD_SIZE*************96 LRANK===============================3 LRANK===============================3 WORLD_SIZE*************96 WORLD_SIZE*************96 [2023-10-27 12:39:32,920] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,921] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,933] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,930] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,921] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,933] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,920] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,921] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,929] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,924] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,933] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,929] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,929] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,929] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,922] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,921] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,923] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,923] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,930] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,933] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,926] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,924] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,921] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,935] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,935] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,935] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,932] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,924] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,935] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,935] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,926] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,932] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,934] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,924] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,937] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,937] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,935] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,935] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,928] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,936] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,937] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,936] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,937] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,936] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,926] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,933] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,937] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,936] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,935] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,936] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,935] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,937] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,933] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,936] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,933] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,936] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,937] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,938] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,926] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,937] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,925] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,936] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,938] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,936] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,937] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,927] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:32,933] [INFO] [comm.py:606:init_distributed] Not using the DeepSpeed or dist launchers, attempting to detect MPI environment... [2023-10-27 12:39:33,204] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=0, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,204] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=1, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,204] [INFO] [comm.py:622:init_distributed] Initializing TorchBackend in DeepSpeed with backend nccl [2023-10-27 12:39:33,206] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=13, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,199] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=28, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,198] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=85, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=45, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=49, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,206] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=12, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,199] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=29, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,198] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=84, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=44, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=48, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=25, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=53, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,203] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=33, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,194] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=89, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,196] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=36, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=40, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,198] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=69, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=21, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=57, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=17, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,196] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=61, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,196] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=9, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=81, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,198] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=93, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=5, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=77, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=24, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=52, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,203] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=32, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,194] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=88, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,196] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=37, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=41, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,198] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=68, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=20, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=56, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=16, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,196] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=60, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,196] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=8, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=80, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,198] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=92, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=4, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=76, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=65, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,204] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=73, local_rank=1, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,207] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=64, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,204] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=72, local_rank=0, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,205] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=3, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,205] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=2, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=59, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=11, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,199] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=87, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,199] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=95, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,210] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=47, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=19, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,196] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=91, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,199] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=43, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=7, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,198] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=79, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=15, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,199] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=71, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=55, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=27, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=51, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,201] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=31, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=23, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,210] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=83, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,205] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=75, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=39, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=63, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=58, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=10, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,200] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=86, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,199] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=94, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,210] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=46, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=18, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,196] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=90, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,199] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=42, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=6, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,198] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=78, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=14, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,199] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=70, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=54, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=26, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=50, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,201] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=30, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,209] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=22, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,210] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=82, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,205] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=74, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=38, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,197] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=62, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=67, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,208] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=66, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,204] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=35, local_rank=3, world_size=96, master_addr=10.5.8.29, master_port=29500 [2023-10-27 12:39:33,204] [INFO] [comm.py:656:mpi_discovery] Discovered MPI settings of world_rank=34, local_rank=2, world_size=96, master_addr=10.5.8.29, master_port=29500 e08r2n08:5136:5136 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.29<0> e08r2n08:5136:5136 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n08:5136:5136 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation RCCL version 2.13.4+hip5.4 HEAD:82f11f7 e08r2n08:5142:5142 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.29<0> e08r2n08:5142:5142 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n08:5142:5142 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n08:5136:6335 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.29<0> e08r2n08:5136:6335 [0] NCCL INFO Using network IB e08r2n08:5140:5140 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.29<0> e08r2n08:5140:5140 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n08:5140:5140 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n08:5141:5141 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.29<0> e08r2n08:5141:5141 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n08:5141:5141 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n07:4889:4889 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.48<0> e08r3n07:4889:4889 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n07:4889:4889 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n09:8675:8675 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.50<0> e08r3n09:8675:8675 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n16:13442:13442 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.37<0> e08r2n16:13442:13442 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n16:13442:13442 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n09:8679:8679 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.50<0> e08r3n09:8679:8679 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n09:8677:8677 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.50<0> e08r3n09:8677:8677 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n19:9030:9030 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.40<0> e08r2n19:9030:9030 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n19:9030:9030 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n02:30401:30401 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.43<0> e08r3n02:30401:30401 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n07:4891:4891 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.48<0> e08r3n07:4891:4891 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n10:18788:18788 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.51<0> e08r3n10:18788:18788 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n02:30401:30401 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n07:4891:4891 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n10:18788:18788 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n16:13444:13444 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.37<0> e08r2n16:13444:13444 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n06:22281:22281 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.47<0> e08r3n06:22281:22281 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n16:13444:13444 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n19:9032:9032 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.40<0> e08r2n19:9032:9032 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n19:9032:9032 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n06:22283:22283 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.47<0> e08r3n06:22283:22283 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n11:29645:29645 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.52<0> e08r3n11:29645:29645 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n19:9033:9033 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.40<0> e08r2n19:9033:9033 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n11:29645:29645 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n03:22735:22735 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.44<0> e08r3n03:22735:22735 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n18:751:751 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.39<0> e08r2n18:751:751 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n19:9033:9033 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n19:9034:9034 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.40<0> e08r2n19:9034:9034 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n00:14532:14532 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.41<0> e08r3n00:14532:14532 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n03:22735:22735 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n09:8679:8679 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n09:8675:8675 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n09:27004:27004 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.30<0> e08r2n09:27004:27004 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n09:8677:8677 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n19:9034:9034 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n00:14532:14532 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n09:27004:27004 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n02:30403:30403 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.43<0> e08r3n02:30403:30403 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n14:18192:18192 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.35<0> e08r2n14:18192:18192 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n11:29647:29647 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.52<0> e08r3n02:30403:30403 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n11:29647:29647 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n01:6275:6275 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.42<0> e08r3n01:6275:6275 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n06:22285:22285 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.47<0> e08r3n06:22285:22285 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n11:29647:29647 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n10:18787:18787 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.51<0> e08r3n10:18787:18787 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n11:29649:29649 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.52<0> e08r3n11:29649:29649 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n10:18787:18787 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n01:6277:6277 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.42<0> e08r3n01:6277:6277 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n18:753:753 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.39<0> e08r2n18:753:753 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n04:16936:16936 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.45<0> e08r3n04:16936:16936 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n18:755:755 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.39<0> e08r2n18:755:755 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n11:29649:29649 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n11:5730:5730 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.32<0> e08r2n11:5730:5730 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n17:21284:21284 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.38<0> e08r2n17:21284:21284 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n14:18194:18194 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.35<0> e08r2n14:18194:18194 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n04:16936:16936 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n11:5730:5730 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n17:21284:21284 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n14:18192:18192 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n09:27002:27002 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.30<0> e08r2n14:18194:18194 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n09:27002:27002 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n06:22284:22284 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.47<0> e08r3n06:22284:22284 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n09:27002:27002 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n18:754:754 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.39<0> e08r2n11:5732:5732 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.32<0> e08r2n11:5732:5732 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n18:754:754 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n11:5732:5732 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n11:29648:29648 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.52<0> e08r3n02:30405:30405 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.43<0> e08r3n11:29648:29648 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n02:30405:30405 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n03:22739:22739 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.44<0> e08r3n03:22739:22739 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n02:30404:30404 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.43<0> e08r3n02:30404:30404 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n00:14534:14534 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.41<0> e08r3n00:14534:14534 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n11:29648:29648 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n03:22739:22739 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n02:30405:30405 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n02:30404:30404 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n00:14534:14534 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n04:16938:16938 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.45<0> e08r3n01:6279:6279 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.42<0> e08r3n01:6279:6279 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n04:16938:16938 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n04:16940:16940 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.45<0> e08r3n04:16940:16940 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n04:16939:16939 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.45<0> e08r3n04:16939:16939 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n09:27005:27005 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.30<0> e08r3n04:16938:16938 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n09:27005:27005 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n04:16940:16940 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n04:16939:16939 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n00:14535:14535 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.41<0> e08r2n09:27005:27005 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n00:14535:14535 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n14:18195:18195 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.35<0> e08r2n15:22021:22021 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.36<0> e08r2n15:22021:22021 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n14:18195:18195 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n00:14535:14535 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n15:22021:22021 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n14:18195:18195 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n12:8673:8673 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.33<0> e08r2n12:8673:8673 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n01:6278:6278 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.42<0> e08r3n01:6278:6278 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n11:5733:5733 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.32<0> e08r2n17:21283:21283 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.38<0> e08r2n11:5733:5733 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n17:21283:21283 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n12:8673:8673 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n09:27006:27006 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.30<0> e08r2n09:27006:27006 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n01:6275:6275 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n00:14536:14536 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.41<0> e08r2n11:5733:5733 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n00:14536:14536 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n17:21282:21282 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.38<0> e08r3n01:6277:6277 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n17:21283:21283 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n01:6279:6279 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n13:23991:23991 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.34<0> e08r2n13:23991:23991 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n17:21282:21282 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n01:6278:6278 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n15:22023:22023 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.36<0> e08r2n15:22023:22023 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n14:18196:18196 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.35<0> e08r2n14:18196:18196 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n09:27006:27006 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n13:23991:23991 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n00:14536:14536 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n10:18786:18786 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.51<0> e08r2n11:5734:5734 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.32<0> e08r3n10:18786:18786 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n11:5734:5734 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n17:21282:21282 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n17:21280:21280 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.38<0> e08r2n17:21280:21280 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n15:22023:22023 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n14:18196:18196 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n10:18786:18786 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n11:5734:5734 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n17:21280:21280 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n07:4892:4892 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.48<0> e08r3n07:4893:4893 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.48<0> e08r3n07:4893:4893 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n10:874:874 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.31<0> e08r2n10:874:874 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n07:4892:4892 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n10:874:874 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n07:4892:4892 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n07:4893:4893 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n10:872:872 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.31<0> e08r2n10:872:872 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n13:23993:23993 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.34<0> e08r2n13:23993:23993 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n10:872:872 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n09:8678:8678 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.50<0> e08r3n09:8678:8678 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n12:8674:8674 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.33<0> e08r2n12:8674:8674 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n13:23993:23993 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n08:13434:13434 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.49<0> e08r3n08:13434:13434 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n09:8678:8678 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n12:8674:8674 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n08:13434:13434 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n16:13445:13445 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.37<0> e08r2n16:13445:13445 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n12:8671:8671 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.33<0> e08r2n12:8671:8671 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n15:22025:22025 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.36<0> e08r2n15:22025:22025 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n16:13445:13445 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n15:22024:22024 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.36<0> e08r2n15:22024:22024 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n12:8671:8671 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n08:13436:13436 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.49<0> e08r3n08:13436:13436 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n13:23995:23995 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.34<0> e08r2n13:23995:23995 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n15:22025:22025 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n15:22024:22024 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n13:23994:23994 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.34<0> e08r3n08:13436:13436 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n13:23994:23994 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n13:23995:23995 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n03:22737:22737 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.44<0> e08r3n03:22737:22737 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n13:23994:23994 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n18:753:753 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n18:754:754 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n18:755:755 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n18:751:751 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n03:22737:22737 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n10:18784:18784 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.51<0> e08r3n10:18784:18784 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n03:22738:22738 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.44<0> e08r3n03:22738:22738 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n10:18784:18784 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n08:13437:13437 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.49<0> e08r3n08:13438:13438 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.49<0> e08r3n08:13437:13437 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n03:22738:22738 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n08:13438:13438 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n12:8675:8675 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.33<0> e08r2n12:8675:8675 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n08:13437:13437 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n08:13438:13438 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n16:13446:13446 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.37<0> e08r2n16:13446:13446 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n12:8675:8675 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n16:13446:13446 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n10:876:876 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.31<0> e08r3n05:24731:24731 [0] NCCL INFO Bootstrap : Using ib0:11.5.8.46<0> e08r3n05:24731:24731 [0] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n10:876:876 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n10:875:875 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.31<0> e08r2n10:875:875 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r2n10:876:876 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n05:24731:24731 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n10:875:875 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n05:24733:24733 [1] NCCL INFO Bootstrap : Using ib0:11.5.8.46<0> e08r3n05:24733:24733 [1] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n05:24733:24733 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n05:24735:24735 [3] NCCL INFO Bootstrap : Using ib0:11.5.8.46<0> e08r3n05:24735:24735 [3] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n05:24735:24735 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n05:24734:24734 [2] NCCL INFO Bootstrap : Using ib0:11.5.8.46<0> e08r3n05:24734:24734 [2] NCCL INFO Plugin name set by env to librccl-net-none.so e08r3n05:24734:24734 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n06:22281:22281 [0] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n06:22284:22284 [2] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n06:22283:22283 [1] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r3n06:22285:22285 [3] NCCL INFO NET/Plugin : No plugin found (librccl-net-none.so), using internal implementation e08r2n08:5142:6491 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.29<0> e08r2n08:5142:6491 [3] NCCL INFO Using network IB e08r2n08:5140:6524 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.29<0> e08r2n08:5140:6524 [1] NCCL INFO Using network IB e08r2n08:5141:6541 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.29<0> e08r2n08:5141:6541 [2] NCCL INFO Using network IB e08r3n07:4889:5932 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.48<0> e08r3n07:4889:5932 [0] NCCL INFO Using network IB e08r3n07:4891:5944 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.48<0> e08r3n07:4891:5944 [1] NCCL INFO Using network IB e08r3n10:18788:19808 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.51<0> e08r3n10:18788:19808 [3] NCCL INFO Using network IB e08r2n16:13442:14572 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.37<0> e08r2n16:13442:14572 [0] NCCL INFO Using network IB e08r2n16:13444:14576 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.37<0> e08r2n16:13444:14576 [1] NCCL INFO Using network IB e08r3n10:18787:19820 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.51<0> e08r3n10:18787:19820 [2] NCCL INFO Using network IB e08r2n19:9030:10143 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.40<0> e08r2n19:9030:10143 [0] NCCL INFO Using network IB e08r2n19:9032:10150 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.40<0> e08r2n19:9032:10150 [1] NCCL INFO Using network IB e08r3n11:29645:30741 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.52<0> e08r3n11:29645:30741 [0] NCCL INFO Using network IB e08r3n11:29649:30749 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.52<0> e08r3n11:29649:30749 [3] NCCL INFO Using network IB e08r3n11:29647:30751 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.52<0> e08r3n11:29647:30751 [1] NCCL INFO Using network IB e08r3n00:14532:15473 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.41<0> e08r3n00:14532:15473 [0] NCCL INFO Using network IB e08r3n03:22739:23827 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.44<0> e08r3n03:22739:23827 [3] NCCL INFO Using network IB e08r3n03:22735:23820 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.44<0> e08r3n03:22735:23820 [0] NCCL INFO Using network IB e08r2n19:9034:10156 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.40<0> e08r2n19:9034:10156 [3] NCCL INFO Using network IB e08r2n19:9033:10155 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.40<0> e08r2n19:9033:10155 [2] NCCL INFO Using network IB e08r2n09:27002:27953 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.30<0> e08r2n09:27002:27953 [0] NCCL INFO Using network IB e08r2n09:27004:27956 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.30<0> e08r2n09:27004:27956 [1] NCCL INFO Using network IB e08r3n09:8677:9721 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.50<0> e08r3n09:8677:9721 [1] NCCL INFO Using network IB e08r3n11:29648:30753 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.52<0> e08r3n11:29648:30753 [2] NCCL INFO Using network IB e08r3n09:8675:9723 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.50<0> e08r3n09:8675:9723 [0] NCCL INFO Using network IB e08r3n09:8679:9728 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.50<0> e08r3n09:8679:9728 [3] NCCL INFO Using network IB e08r3n00:14536:15487 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.41<0> e08r3n00:14536:15487 [3] NCCL INFO Using network IB e08r3n07:4893:5961 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.48<0> e08r3n07:4893:5961 [3] NCCL INFO Using network IB e08r2n11:5732:6769 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.32<0> e08r2n11:5732:6769 [1] NCCL INFO Using network IB e08r2n11:5730:6763 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.32<0> e08r2n11:5730:6763 [0] NCCL INFO Using network IB e08r3n10:18786:19830 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.51<0> e08r3n10:18786:19830 [1] NCCL INFO Using network IB e08r3n02:30401:31205 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.43<0> e08r3n02:30401:31205 [0] NCCL INFO Using network IB e08r3n02:30403:31209 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.43<0> e08r3n02:30403:31209 [1] NCCL INFO Using network IB e08r3n00:14534:15491 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.41<0> e08r3n00:14534:15491 [1] NCCL INFO Using network IB e08r3n02:30405:31208 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.43<0> e08r3n02:30405:31208 [3] NCCL INFO Using network IB e08r2n11:5734:6772 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.32<0> e08r2n11:5734:6772 [3] NCCL INFO Using network IB e08r2n11:5733:6773 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.32<0> e08r2n11:5733:6773 [2] NCCL INFO Using network IB e08r3n00:14535:15492 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.41<0> e08r3n00:14535:15492 [2] NCCL INFO Using network IB e08r2n09:27006:27966 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.30<0> e08r2n09:27006:27966 [3] NCCL INFO Using network IB e08r2n09:27005:27965 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.30<0> e08r2n09:27005:27965 [2] NCCL INFO Using network IB e08r2n15:22021:22997 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.36<0> e08r2n15:22021:22997 [0] NCCL INFO Using network IB e08r3n04:16938:17748 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.45<0> e08r3n04:16938:17748 [1] NCCL INFO Using network IB e08r3n02:30404:31213 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.43<0> e08r3n02:30404:31213 [2] NCCL INFO Using network IB e08r3n04:16936:17745 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.45<0> e08r3n04:16936:17745 [0] NCCL INFO Using network IB e08r3n04:16939:17749 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.45<0> e08r3n04:16939:17749 [2] NCCL INFO Using network IB e08r3n04:16940:17743 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.45<0> e08r3n04:16940:17743 [3] NCCL INFO Using network IB e08r3n07:4892:5963 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.48<0> e08r3n07:4892:5963 [2] NCCL INFO Using network IB e08r2n13:23991:25150 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.34<0> e08r2n13:23991:25150 [0] NCCL INFO Using network IB e08r2n15:22023:23011 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.36<0> e08r2n15:22023:23011 [1] NCCL INFO Using network IB e08r3n10:18784:19834 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.51<0> e08r3n10:18784:19834 [0] NCCL INFO Using network IB e08r2n13:23993:25161 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.34<0> e08r2n13:23993:25161 [1] NCCL INFO Using network IB e08r2n14:18195:19161 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.35<0> e08r2n14:18195:19161 [2] NCCL INFO Using network IB e08r2n14:18192:19156 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.35<0> e08r2n14:18192:19156 [0] NCCL INFO Using network IB e08r2n14:18196:19160 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.35<0> e08r2n14:18196:19160 [3] NCCL INFO Using network IB e08r2n17:21283:22448 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.38<0> e08r2n17:21283:22448 [2] NCCL INFO Using network IB e08r2n14:18194:19155 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.35<0> e08r2n14:18194:19155 [1] NCCL INFO Using network IB e08r3n01:6278:7261 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.42<0> e08r3n01:6278:7261 [2] NCCL INFO Using network IB e08r2n13:23995:25163 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.34<0> e08r2n13:23995:25163 [3] NCCL INFO Using network IB e08r3n01:6275:7256 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.42<0> e08r3n01:6275:7256 [0] NCCL INFO Using network IB e08r3n09:8678:9738 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.50<0> e08r3n09:8678:9738 [2] NCCL INFO Using network IB e08r3n03:22737:23845 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.44<0> e08r3n03:22737:23845 [1] NCCL INFO Using network IB e08r2n17:21282:22447 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.38<0> e08r2n17:21282:22447 [1] NCCL INFO Using network IB e08r3n01:6277:7260 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.42<0> e08r3n01:6277:7260 [1] NCCL INFO Using network IB e08r3n01:6279:7255 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.42<0> e08r3n01:6279:7255 [3] NCCL INFO Using network IB e08r2n17:21284:22443 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.38<0> e08r2n17:21284:22443 [3] NCCL INFO Using network IB e08r2n17:21280:22441 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.38<0> e08r2n17:21280:22441 [0] NCCL INFO Using network IB e08r2n15:22024:23016 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.36<0> e08r2n15:22024:23016 [2] NCCL INFO Using network IB e08r2n13:23994:25164 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.34<0> e08r2n16:13445:14603 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.37<0> e08r2n16:13445:14603 [2] NCCL INFO Using network IB e08r2n13:23994:25164 [2] NCCL INFO Using network IB e08r2n12:8674:9663 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.33<0> e08r2n12:8674:9663 [2] NCCL INFO Using network IB e08r2n15:22025:23017 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.36<0> e08r2n15:22025:23017 [3] NCCL INFO Using network IB e08r2n12:8671:9661 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.33<0> e08r2n12:8671:9661 [0] NCCL INFO Using network IB e08r2n12:8673:9656 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.33<0> e08r2n12:8673:9656 [1] NCCL INFO Using network IB e08r2n12:8675:9665 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.33<0> e08r2n12:8675:9665 [3] NCCL INFO Using network IB e08r3n03:22738:23847 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.44<0> e08r3n03:22738:23847 [2] NCCL INFO Using network IB e08r3n08:13436:14594 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.49<0> e08r3n08:13436:14594 [1] NCCL INFO Using network IB e08r3n08:13438:14591 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.49<0> e08r3n08:13438:14591 [3] NCCL INFO Using network IB e08r2n16:13446:14609 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.37<0> e08r2n16:13446:14609 [3] NCCL INFO Using network IB e08r2n18:751:1877 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.39<0> e08r2n18:751:1877 [0] NCCL INFO Using network IB e08r2n18:755:1882 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.39<0> e08r2n18:755:1882 [3] NCCL INFO Using network IB e08r2n18:753:1883 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.39<0> e08r2n18:753:1883 [1] NCCL INFO Using network IB e08r2n18:754:1880 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.39<0> e08r2n18:754:1880 [2] NCCL INFO Using network IB e08r3n08:13434:14586 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.49<0> e08r3n08:13434:14586 [0] NCCL INFO Using network IB e08r3n05:24735:25797 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.46<0> e08r3n05:24735:25797 [3] NCCL INFO Using network IB e08r3n05:24731:25791 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.46<0> e08r3n05:24731:25791 [0] NCCL INFO Using network IB e08r3n08:13437:14595 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.49<0> e08r3n08:13437:14595 [2] NCCL INFO Using network IB e08r2n10:872:1911 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.31<0> e08r2n10:872:1911 [0] NCCL INFO Using network IB e08r2n10:876:1918 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.31<0> e08r2n10:876:1918 [3] NCCL INFO Using network IB e08r2n10:874:1920 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.31<0> e08r2n10:874:1920 [1] NCCL INFO Using network IB e08r2n10:875:1919 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.31<0> e08r2n10:875:1919 [2] NCCL INFO Using network IB e08r3n05:24733:25802 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.46<0> e08r3n05:24733:25802 [1] NCCL INFO Using network IB e08r3n05:24734:25804 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.46<0> e08r3n05:24734:25804 [2] NCCL INFO Using network IB e08r3n06:22281:23330 [0] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.47<0> e08r3n06:22281:23330 [0] NCCL INFO Using network IB e08r3n06:22283:23339 [1] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.47<0> e08r3n06:22283:23339 [1] NCCL INFO Using network IB e08r3n06:22285:23335 [3] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.47<0> e08r3n06:22285:23335 [3] NCCL INFO Using network IB e08r3n06:22284:23338 [2] NCCL INFO NET/IB : Using [0]mlx5_0:1/IB [RO]; OOB ib0:11.5.8.47<0> e08r3n06:22284:23338 [2] NCCL INFO Using network IB e08r3n07:4893:5961 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n11:29647:30751 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n09:8679:9728 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n12:8673:9656 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n13:23993:25161 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n11:29648:30753 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n07:4891:5944 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n10:18787:19820 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n09:27002:27953 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n10:18788:19808 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n13:23991:25150 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n09:8678:9738 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n09:27004:27956 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n09:8675:9723 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n11:29645:30741 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n09:8677:9721 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n11:29649:30749 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n12:8675:9665 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n12:8674:9663 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n07:4889:5932 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n10:18786:19830 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n10:18784:19834 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n08:13434:14586 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n10:876:1918 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n08:5140:6524 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n08:13436:14594 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n08:5136:6335 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n12:8671:9661 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n08:13438:14591 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n08:13437:14595 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n13:23995:25163 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n07:4892:5963 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n06:22285:23335 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n10:875:1919 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n08:5142:6491 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n13:23994:25164 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n16:13442:14572 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n08:5141:6541 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n00:14536:15487 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n00:14535:15492 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n17:21282:22447 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n18:755:1882 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n09:27005:27965 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n09:27006:27966 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n17:21284:22443 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n16:13445:14603 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n02:30404:31213 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n16:13444:14576 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n17:21283:22448 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n16:13446:14609 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n17:21280:22441 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n18:753:1883 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n04:16940:17743 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n11:5732:6769 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n14:18192:19156 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n14:18194:19155 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n02:30405:31208 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n14:18196:19160 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n14:18195:19161 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n10:874:1920 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n11:5734:6772 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n01:6278:7261 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n06:22283:23339 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n11:5733:6773 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n10:872:1911 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n05:24731:25791 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n02:30401:31205 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n11:5730:6763 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n05:24733:25802 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n02:30403:31209 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n18:751:1877 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n05:24734:25804 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n18:754:1880 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n00:14532:15473 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n04:16939:17749 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n00:14534:15491 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n04:16938:17748 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n01:6279:7255 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n19:9032:10150 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n06:22284:23338 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n04:16936:17745 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n01:6277:7260 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n06:22281:23330 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n05:24735:25797 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n01:6275:7256 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n19:9034:10156 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n19:9033:10155 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n19:9030:10143 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n15:22021:22997 [0] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n15:22025:23017 [3] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n15:22023:23011 [1] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r2n15:22024:23016 [2] NCCL INFO rocm_smi_lib: version 2.8.0.0 e08r3n06:22285:23335 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n10:18787:19820 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n09:27002:27953 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n10:18788:19808 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n09:27004:27956 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n18:755:1882 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n09:27005:27965 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n06:22283:23339 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n16:13442:14572 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n09:27006:27966 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n06:22281:23330 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n16:13446:14609 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n10:18784:19834 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n08:13434:14586 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n11:5732:6769 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n18:753:1883 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n08:5140:6524 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n08:5136:6335 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n08:5142:6491 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n06:22284:23338 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n16:13445:14603 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n10:18786:19830 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n08:13436:14594 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n11:5734:6772 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n18:751:1877 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n04:16940:17743 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n05:24731:25791 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n02:30404:31213 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n00:14536:15487 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n17:21282:22447 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n14:18192:19156 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n08:5141:6541 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n06:22285:23335 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n16:13444:14576 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n10:18787:19820 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n08:13438:14591 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n11:5730:6763 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n18:754:1880 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n04:16936:17745 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n05:24733:25802 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n02:30405:31208 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n00:14535:15492 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n17:21284:22443 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n14:18196:19160 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n11:29647:30751 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n13:23993:25161 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n15:22021:22997 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n09:27002:27953 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n19:9032:10150 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n09:8679:9728 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n10:876:1918 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n07:4893:5961 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n01:6278:7261 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n08:5140:6524 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n08:5136:6335 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n08:5142:6491 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n08:5141:6541 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n06:22283:23339 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n16:13442:14572 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n10:18788:19808 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n08:13437:14595 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n11:5733:6773 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n18:755:1882 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n04:16939:17749 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n05:24735:25797 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n02:30401:31205 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n00:14532:15473 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n17:21280:22441 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n14:18194:19155 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n11:29645:30741 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n13:23991:25150 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n15:22023:23011 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n09:27004:27956 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n19:9034:10156 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n09:8675:9723 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n10:872:1911 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n07:4891:5944 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n01:6279:7255 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n12:8673:9656 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n06:22281:23330 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n16:13446:14609 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n10:18784:19834 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n08:13434:14586 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n11:5732:6769 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n18:753:1883 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n04:16938:17748 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n05:24734:25804 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n02:30403:31209 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n00:14534:15491 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n17:21283:22448 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n14:18195:19161 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n11:29649:30749 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n13:23995:25163 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n15:22025:23017 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n09:27005:27965 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n19:9030:10143 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n09:8678:9738 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n10:875:1919 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n07:4889:5932 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n01:6277:7260 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n12:8674:9663 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n06:22284:23338 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n16:13445:14603 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n10:18786:19830 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n08:13436:14594 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n11:5734:6772 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n18:751:1877 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n04:16940:17743 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n05:24731:25791 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n02:30404:31213 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n00:14536:15487 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n17:21282:22447 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n14:18192:19156 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n11:29648:30753 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n13:23994:25164 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n15:22024:23016 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n09:27006:27966 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n19:9033:10155 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n09:8677:9721 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n10:874:1920 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n07:4892:5963 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n01:6275:7256 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n12:8675:9665 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r2n16:13444:14576 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n08:13438:14591 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n11:5730:6763 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n18:754:1880 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n04:16936:17745 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n05:24733:25802 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n02:30405:31208 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n00:14532:15473 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n17:21284:22443 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n14:18196:19160 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n11:29647:30751 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n13:23993:25161 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n15:22021:22997 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n19:9032:10150 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n09:8679:9728 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n10:876:1918 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n07:4893:5961 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n01:6278:7261 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n12:8671:9661 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n08:13437:14595 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n11:5733:6773 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n04:16939:17749 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n05:24735:25797 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n02:30401:31205 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n00:14535:15492 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n17:21280:22441 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n14:18194:19155 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n11:29645:30741 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n13:23991:25150 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n15:22023:23011 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n19:9034:10156 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n09:8675:9723 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n10:872:1911 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n07:4891:5944 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n01:6279:7255 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n12:8673:9656 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n04:16938:17748 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n05:24734:25804 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n02:30403:31209 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n00:14534:15491 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n17:21283:22448 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n14:18195:19161 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n11:29649:30749 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n13:23995:25163 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n15:22025:23017 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n19:9030:10143 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n09:8678:9738 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n10:874:1920 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n07:4889:5932 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n01:6275:7256 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n12:8674:9663 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n11:29648:30753 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n13:23994:25164 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n15:22024:23016 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n19:9033:10155 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n09:8677:9721 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n10:875:1919 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n07:4892:5963 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n01:6277:7260 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n12:8675:9665 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n12:8671:9661 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n03:22737:23845 [1] /data/jenkins_workspace/workspace/rccl_release/src/misc/rocm_smi_wrap.cc:38 NCCL WARN ROCm SMI init failure An error occurred during initialization, during monitor discovery or when when initializing internal data structures e08r3n03:22739:23827 [3] /data/jenkins_workspace/workspace/rccl_release/src/misc/rocm_smi_wrap.cc:38 NCCL WARN ROCm SMI init failure An error occurred during initialization, during monitor discovery or when when initializing internal data structures e08r3n03:22735:23820 [0] /data/jenkins_workspace/workspace/rccl_release/src/misc/rocm_smi_wrap.cc:38 NCCL WARN ROCm SMI init failure An error occurred during initialization, during monitor discovery or when when initializing internal data structures e08r3n03:22738:23847 [2] /data/jenkins_workspace/workspace/rccl_release/src/misc/rocm_smi_wrap.cc:38 NCCL WARN ROCm SMI init failure An error occurred during initialization, during monitor discovery or when when initializing internal data structures e08r3n03:22737:23845 [1] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n03:22735:23820 [0] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n03:22738:23847 [2] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n03:22739:23827 [3] NCCL INFO NCCL_P2P_LEVEL set by environment to SYS e08r3n03:22737:23845 [1] NCCL INFO Setting affinity for GPU 0 to ff00 e08r3n03:22735:23820 [0] NCCL INFO Setting affinity for GPU 116699136 to ff e08r3n03:22738:23847 [2] NCCL INFO Setting affinity for GPU 0 to ff0000 e08r3n03:22739:23827 [3] NCCL INFO Setting affinity for GPU 0 to ff000000 e08r3n03:22739:23827 [3] NCCL INFO Trees [0] -1/-1/-1->63->62 [1] -1/-1/-1->63->62 comm 0x2b0524000ab0 nRanks 96 busId 63000 e08r3n05:24735:25797 [3] NCCL INFO Trees [0] -1/-1/-1->71->70 [1] -1/-1/-1->71->70 comm 0x2ac218000ab0 nRanks 96 busId 63000 e08r3n05:24731:25791 [0] NCCL INFO Trees [0] 69/-1/-1->68->73 [1] 69/64/-1->68->76 comm 0x2b85d4000ab0 nRanks 96 busId 4000 e08r3n06:22283:23339 [1] NCCL INFO Trees [0] 74/68/-1->73->72 [1] 74/-1/-1->73->72 comm 0x2b9a88000ab0 nRanks 96 busId 26000 e08r3n08:13436:14594 [1] NCCL INFO Trees [0] 82/72/-1->81->80 [1] 82/-1/-1->81->80 comm 0x2b1954000ab0 nRanks 96 busId 26000 e08r3n06:22281:23330 [0] NCCL INFO Trees [0] 73/76/-1->72->81 [1] 73/-1/-1->72->69 comm 0x2af9e0000ab0 nRanks 96 busId 4000 e08r3n08:13437:14595 [2] NCCL INFO Trees [0] 83/-1/-1->82->81 [1] 83/-1/-1->82->81 comm 0x2b8f38000ab0 nRanks 96 busId 43000 e08r3n04:16938:17748 [1] NCCL INFO Trees [0] 66/32/-1->65->64 [1] 66/-1/-1->65->64 comm 0x2b0b78000ab0 nRanks 96 busId 26000 e08r3n05:24733:25802 [1] NCCL INFO Trees [0] 70/-1/-1->69->68 [1] 70/72/-1->69->68 comm 0x2ab9d4000ab0 nRanks 96 busId 26000 e08r3n06:22284:23338 [2] NCCL INFO Trees [0] 75/-1/-1->74->73 [1] 75/-1/-1->74->73 comm 0x2b141c000ab0 nRanks 96 busId 43000 e08r3n08:13434:14586 [0] NCCL INFO Trees [0] 81/88/-1->80->64 [1] 81/-1/-1->80->84 comm 0x2abcf4000ab0 nRanks 96 busId 4000 e08r3n04:16940:17743 [3] NCCL INFO Trees [0] -1/-1/-1->67->66 [1] -1/-1/-1->67->66 comm 0x2b1e28000ab0 nRanks 96 busId 63000 e08r3n05:24734:25804 [2] NCCL INFO Trees [0] 71/-1/-1->70->69 [1] 71/-1/-1->70->69 comm 0x2b26b0000ab0 nRanks 96 busId 43000 e08r3n07:4893:5961 [3] NCCL INFO Trees [0] -1/-1/-1->79->78 [1] -1/-1/-1->79->78 comm 0x2ba69c000ab0 nRanks 96 busId 63000 e08r3n06:22285:23335 [3] NCCL INFO Trees [0] -1/-1/-1->75->74 [1] -1/-1/-1->75->74 comm 0x2b91b4000ab0 nRanks 96 busId 63000 e08r3n08:13438:14591 [3] NCCL INFO Trees [0] -1/-1/-1->83->82 [1] -1/-1/-1->83->82 comm 0x2b2614000ab0 nRanks 96 busId 63000 e08r3n04:16939:17749 [2] NCCL INFO Trees [0] 67/-1/-1->66->65 [1] 67/-1/-1->66->65 comm 0x2b4eb4000ab0 nRanks 96 busId 43000 e08r3n07:4892:5963 [2] NCCL INFO Trees [0] 79/-1/-1->78->77 [1] 79/-1/-1->78->77 comm 0x2b9670000ab0 nRanks 96 busId 43000 e08r3n04:16936:17745 [0] NCCL INFO Trees [0] 65/80/-1->64->0 [1] 65/-1/-1->64->68 comm 0x2b3574000ab0 nRanks 96 busId 4000 e08r3n07:4889:5932 [0] NCCL INFO Trees [0] 77/-1/-1->76->72 [1] 77/68/-1->76->61 comm 0x2aed78000ab0 nRanks 96 busId 4000 e08r3n07:4891:5944 [1] NCCL INFO Trees [0] 78/-1/-1->77->76 [1] 78/84/-1->77->76 comm 0x2b7a94000ab0 nRanks 96 busId 26000 e08r3n10:18786:19830 [1] NCCL INFO Trees [0] 90/84/-1->89->88 [1] 90/-1/-1->89->88 comm 0x2ac35c000ab0 nRanks 96 busId 26000 e08r3n09:8675:9723 [0] NCCL INFO Trees [0] 85/-1/-1->84->89 [1] 85/80/-1->84->77 comm 0x2b416c000ab0 nRanks 96 busId 4000 e08r3n10:18784:19834 [0] NCCL INFO Trees [0] 89/92/-1->88->80 [1] 89/-1/-1->88->85 comm 0x2af008000ab0 nRanks 96 busId 4000 e08r3n09:8677:9721 [1] NCCL INFO Trees [0] 86/-1/-1->85->84 [1] 86/88/-1->85->84 comm 0x2b4344000ab0 nRanks 96 busId 26000 e08r3n10:18788:19808 [3] NCCL INFO Trees [0] -1/-1/-1->91->90 [1] -1/-1/-1->91->90 comm 0x2ad848000ab0 nRanks 96 busId 63000 e08r3n09:8679:9728 [3] NCCL INFO Trees [0] -1/-1/-1->87->86 [1] -1/-1/-1->87->86 comm 0x2b0c4c000ab0 nRanks 96 busId 63000 e08r3n11:29645:30741 [0] NCCL INFO Trees [0] 93/-1/-1->92->88 [1] 93/28/-1->92->-1 comm 0x2ac238000ab0 nRanks 96 busId 4000 e08r3n10:18787:19820 [2] NCCL INFO Trees [0] 91/-1/-1->90->89 [1] 91/-1/-1->90->89 comm 0x2ae6c4000ab0 nRanks 96 busId 43000 e08r3n09:8678:9738 [2] NCCL INFO Trees [0] 87/-1/-1->86->85 [1] 87/-1/-1->86->85 comm 0x2b20f8000ab0 nRanks 96 busId 43000 e08r3n11:29647:30751 [1] NCCL INFO Trees [0] 94/-1/-1->93->92 [1] 94/-1/-1->93->92 comm 0x2abd10000ab0 nRanks 96 busId 26000 e08r3n11:29648:30753 [2] NCCL INFO Trees [0] 95/-1/-1->94->93 [1] 95/-1/-1->94->93 comm 0x2b8da8000ab0 nRanks 96 busId 43000 e08r3n11:29649:30749 [3] NCCL INFO Trees [0] -1/-1/-1->95->94 [1] -1/-1/-1->95->94 comm 0x2ba6ec000ab0 nRanks 96 busId 63000 e08r2n08:5136:6335 [0] NCCL INFO Channel 00/02 : 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 e08r2n08:5136:6335 [0] NCCL INFO Channel 01/02 : 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 e08r2n08:5136:6335 [0] NCCL INFO Trees [0] 1/64/-1->0->-1 [1] 1/-1/-1->0->4 comm 0x2b2e44000ab0 nRanks 96 busId 4000 e08r2n08:5140:6524 [1] NCCL INFO Trees [0] 2/-1/-1->1->0 [1] 2/-1/-1->1->0 comm 0x2b30cc000ab0 nRanks 96 busId 26000 e08r2n08:5141:6541 [2] NCCL INFO Trees [0] 3/-1/-1->2->1 [1] 3/-1/-1->2->1 comm 0x2b5bd8000ab0 nRanks 96 busId 43000 e08r2n08:5142:6491 [3] NCCL INFO Trees [0] -1/-1/-1->3->2 [1] -1/-1/-1->3->2 comm 0x2ad4a8000ab0 nRanks 96 busId 63000 e08r2n09:27002:27953 [0] NCCL INFO Trees [0] 5/-1/-1->4->9 [1] 5/0/-1->4->12 comm 0x2b0d1c000ab0 nRanks 96 busId 4000 e08r2n09:27004:27956 [1] NCCL INFO Trees [0] 6/-1/-1->5->4 [1] 6/8/-1->5->4 comm 0x2af6e0000ab0 nRanks 96 busId 26000 e08r2n09:27006:27966 [3] NCCL INFO Trees [0] -1/-1/-1->7->6 [1] -1/-1/-1->7->6 comm 0x2b56e4000ab0 nRanks 96 busId 63000 e08r2n10:874:1920 [1] NCCL INFO Trees [0] 10/4/-1->9->8 [1] 10/-1/-1->9->8 comm 0x2b1f10000ab0 nRanks 96 busId 26000 e08r2n09:27005:27965 [2] NCCL INFO Trees [0] 7/-1/-1->6->5 [1] 7/-1/-1->6->5 comm 0x2b3e48000ab0 nRanks 96 busId 43000 e08r2n10:872:1911 [0] NCCL INFO Trees [0] 9/12/-1->8->17 [1] 9/-1/-1->8->5 comm 0x2b6040000ab0 nRanks 96 busId 4000 e08r2n10:876:1918 [3] NCCL INFO Trees [0] -1/-1/-1->11->10 [1] -1/-1/-1->11->10 comm 0x2b2d0c000ab0 nRanks 96 busId 63000 e08r2n10:875:1919 [2] NCCL INFO Trees [0] 11/-1/-1->10->9 [1] 11/-1/-1->10->9 comm 0x2af8c4000ab0 nRanks 96 busId 43000 e08r2n11:5730:6763 [0] NCCL INFO Trees [0] 13/-1/-1->12->8 [1] 13/4/-1->12->28 comm 0x2b7a5c000ab0 nRanks 96 busId 4000 e08r2n11:5732:6769 [1] NCCL INFO Trees [0] 14/-1/-1->13->12 [1] 14/20/-1->13->12 comm 0x2b11a0000ab0 nRanks 96 busId 26000 e08r2n11:5733:6773 [2] NCCL INFO Trees [0] 15/-1/-1->14->13 [1] 15/-1/-1->14->13 comm 0x2ae6f0000ab0 nRanks 96 busId 43000 e08r2n11:5734:6772 [3] NCCL INFO Trees [0] -1/-1/-1->15->14 [1] -1/-1/-1->15->14 comm 0x2b4144000ab0 nRanks 96 busId 63000 e08r2n12:8671:9661 [0] NCCL INFO Trees [0] 17/24/-1->16->33 [1] 17/-1/-1->16->20 comm 0x2b66f4000ab0 nRanks 96 busId 4000 e08r2n12:8673:9656 [1] NCCL INFO Trees [0] 18/8/-1->17->16 [1] 18/-1/-1->17->16 comm 0x2b92b8000ab0 nRanks 96 busId 26000 e08r2n12:8674:9663 [2] NCCL INFO Trees [0] 19/-1/-1->18->17 [1] 19/-1/-1->18->17 comm 0x2b65a0000ab0 nRanks 96 busId 43000 e08r2n12:8675:9665 [3] NCCL INFO Trees [0] -1/-1/-1->19->18 [1] -1/-1/-1->19->18 comm 0x2b2e18000ab0 nRanks 96 busId 63000 e08r3n08:13434:14586 [0] NCCL INFO Channel 00/0 : 79[63000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abcf4000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Channel 00/0 : 75[63000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aed78000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Trees [0] 21/-1/-1->20->25 [1] 21/16/-1->20->13 comm 0x2b5014000ab0 nRanks 96 busId 4000 e08r3n05:24731:25791 [0] NCCL INFO Channel 00/0 : 67[63000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b85d4000ab0 nRanks 96 e08r3n04:16936:17745 [0] NCCL INFO Channel 00/0 : 63[63000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b3574000ab0 nRanks 96 e08r2n13:23993:25161 [1] NCCL INFO Trees [0] 22/-1/-1->21->20 [1] 22/24/-1->21->20 comm 0x2b4058000ab0 nRanks 96 busId 26000 e08r3n06:22281:23330 [0] NCCL INFO Channel 00/0 : 71[63000] -> 72[4000] [receive] via NET/IB/0 comm 0x2af9e0000ab0 nRanks 96 e08r3n06:22283:23339 [1] NCCL INFO Channel 00 : 73[26000] -> 74[43000] via P2P/IPC comm 0x2b9a88000ab0 nRanks 96 e08r2n13:23994:25164 [2] NCCL INFO Trees [0] 23/-1/-1->22->21 [1] 23/-1/-1->22->21 comm 0x2b5d8c000ab0 nRanks 96 busId 43000 e08r3n08:13437:14595 [2] NCCL INFO Channel 00 : 82[43000] -> 83[63000] via P2P/IPC comm 0x2b8f38000ab0 nRanks 96 e08r3n05:24733:25802 [1] NCCL INFO Channel 00 : 69[26000] -> 70[43000] via P2P/IPC comm 0x2ab9d4000ab0 nRanks 96 e08r3n08:13436:14594 [1] NCCL INFO Channel 00 : 81[26000] -> 82[43000] via P2P/IPC comm 0x2b1954000ab0 nRanks 96 e08r2n13:23995:25163 [3] NCCL INFO Trees [0] -1/-1/-1->23->22 [1] -1/-1/-1->23->22 comm 0x2b4b08000ab0 nRanks 96 busId 63000 e08r3n05:24734:25804 [2] NCCL INFO Channel 00 : 70[43000] -> 71[63000] via P2P/IPC comm 0x2b26b0000ab0 nRanks 96 e08r3n07:4891:5944 [1] NCCL INFO Channel 00 : 77[26000] -> 78[43000] via P2P/IPC comm 0x2b7a94000ab0 nRanks 96 e08r3n06:22284:23338 [2] NCCL INFO Channel 00 : 74[43000] -> 75[63000] via P2P/IPC comm 0x2b141c000ab0 nRanks 96 e08r3n04:16938:17748 [1] NCCL INFO Channel 00 : 65[26000] -> 66[43000] via P2P/IPC comm 0x2b0b78000ab0 nRanks 96 e08r3n04:16939:17749 [2] NCCL INFO Channel 00 : 66[43000] -> 67[63000] via P2P/IPC comm 0x2b4eb4000ab0 nRanks 96 e08r3n09:8675:9723 [0] NCCL INFO Channel 00/0 : 83[63000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b416c000ab0 nRanks 96 e08r3n07:4892:5963 [2] NCCL INFO Channel 00 : 78[43000] -> 79[63000] via P2P/IPC comm 0x2b9670000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 00/0 : 87[63000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af008000ab0 nRanks 96 e08r3n08:13436:14594 [1] NCCL INFO Channel 01 : 81[26000] -> 82[43000] via P2P/IPC comm 0x2b1954000ab0 nRanks 96 e08r3n09:8677:9721 [1] NCCL INFO Channel 00 : 85[26000] -> 86[43000] via P2P/IPC comm 0x2b4344000ab0 nRanks 96 e08r3n10:18786:19830 [1] NCCL INFO Channel 00 : 89[26000] -> 90[43000] via P2P/IPC comm 0x2ac35c000ab0 nRanks 96 e08r3n11:29645:30741 [0] NCCL INFO Channel 00/0 : 91[63000] -> 92[4000] [receive] via NET/IB/0 comm 0x2ac238000ab0 nRanks 96 e08r3n09:8678:9738 [2] NCCL INFO Channel 00 : 86[43000] -> 87[63000] via P2P/IPC comm 0x2b20f8000ab0 nRanks 96 e08r3n06:22283:23339 [1] NCCL INFO Channel 01 : 73[26000] -> 74[43000] via P2P/IPC comm 0x2b9a88000ab0 nRanks 96 e08r3n05:24734:25804 [2] NCCL INFO Channel 01 : 70[43000] -> 71[63000] via P2P/IPC comm 0x2b26b0000ab0 nRanks 96 e08r3n11:29647:30751 [1] NCCL INFO Channel 00 : 93[26000] -> 94[43000] via P2P/IPC comm 0x2abd10000ab0 nRanks 96 e08r3n05:24733:25802 [1] NCCL INFO Channel 01 : 69[26000] -> 70[43000] via P2P/IPC comm 0x2ab9d4000ab0 nRanks 96 e08r3n04:16938:17748 [1] NCCL INFO Channel 01 : 65[26000] -> 66[43000] via P2P/IPC comm 0x2b0b78000ab0 nRanks 96 e08r2n08:5136:6335 [0] NCCL INFO Channel 00/0 : 95[63000] -> 0[4000] [receive] via NET/IB/0 comm 0x2b2e44000ab0 nRanks 96 e08r3n06:22284:23338 [2] NCCL INFO Channel 01 : 74[43000] -> 75[63000] via P2P/IPC comm 0x2b141c000ab0 nRanks 96 e08r3n08:13437:14595 [2] NCCL INFO Channel 01 : 82[43000] -> 83[63000] via P2P/IPC comm 0x2b8f38000ab0 nRanks 96 e08r3n10:18787:19820 [2] NCCL INFO Channel 00 : 90[43000] -> 91[63000] via P2P/IPC comm 0x2ae6c4000ab0 nRanks 96 e08r3n10:18786:19830 [1] NCCL INFO Channel 01 : 89[26000] -> 90[43000] via P2P/IPC comm 0x2ac35c000ab0 nRanks 96 e08r3n04:16939:17749 [2] NCCL INFO Channel 01 : 66[43000] -> 67[63000] via P2P/IPC comm 0x2b4eb4000ab0 nRanks 96 e08r3n07:4892:5963 [2] NCCL INFO Channel 01 : 78[43000] -> 79[63000] via P2P/IPC comm 0x2b9670000ab0 nRanks 96 e08r2n14:18194:19155 [1] NCCL INFO Trees [0] 26/20/-1->25->24 [1] 26/-1/-1->25->24 comm 0x2b43b4000ab0 nRanks 96 busId 26000 e08r2n14:18195:19161 [2] NCCL INFO Trees [0] 27/-1/-1->26->25 [1] 27/-1/-1->26->25 comm 0x2b74c4000ab0 nRanks 96 busId 43000 e08r2n15:22021:22997 [0] NCCL INFO Trees [0] 29/-1/-1->28->24 [1] 29/12/-1->28->92 comm 0x2b5d18000ab0 nRanks 96 busId 4000 e08r3n09:8678:9738 [2] NCCL INFO Channel 01 : 86[43000] -> 87[63000] via P2P/IPC comm 0x2b20f8000ab0 nRanks 96 e08r2n14:18196:19160 [3] NCCL INFO Trees [0] -1/-1/-1->27->26 [1] -1/-1/-1->27->26 comm 0x2ab5e8000ab0 nRanks 96 busId 63000 e08r2n15:22023:23011 [1] NCCL INFO Trees [0] 30/-1/-1->29->28 [1] 30/60/-1->29->28 comm 0x2ad4b8000ab0 nRanks 96 busId 26000 e08r3n09:8677:9721 [1] NCCL INFO Channel 01 : 85[26000] -> 86[43000] via P2P/IPC comm 0x2b4344000ab0 nRanks 96 e08r3n11:29648:30753 [2] NCCL INFO Channel 00 : 94[43000] -> 95[63000] via P2P/IPC comm 0x2b8da8000ab0 nRanks 96 e08r3n07:4891:5944 [1] NCCL INFO Channel 01 : 77[26000] -> 78[43000] via P2P/IPC comm 0x2b7a94000ab0 nRanks 96 e08r2n14:18192:19156 [0] NCCL INFO Trees [0] 25/28/-1->24->16 [1] 25/-1/-1->24->21 comm 0x2b88b4000ab0 nRanks 96 busId 4000 e08r2n15:22024:23016 [2] NCCL INFO Trees [0] 31/-1/-1->30->29 [1] 31/-1/-1->30->29 comm 0x2b123c000ab0 nRanks 96 busId 43000 e08r2n16:13442:14572 [0] NCCL INFO Trees [0] 33/48/-1->32->65 [1] 33/-1/-1->32->36 comm 0x2b4aa4000ab0 nRanks 96 busId 4000 e08r3n10:18787:19820 [2] NCCL INFO Channel 01 : 90[43000] -> 91[63000] via P2P/IPC comm 0x2ae6c4000ab0 nRanks 96 e08r2n17:21282:22447 [1] NCCL INFO Trees [0] 38/-1/-1->37->36 [1] 38/40/-1->37->36 comm 0x2abf00000ab0 nRanks 96 busId 26000 e08r2n08:5140:6524 [1] NCCL INFO Channel 00 : 1[26000] -> 2[43000] via P2P/IPC comm 0x2b30cc000ab0 nRanks 96 e08r2n08:5141:6541 [2] NCCL INFO Channel 00 : 2[43000] -> 3[63000] via P2P/IPC comm 0x2b5bd8000ab0 nRanks 96 e08r2n15:22025:23017 [3] NCCL INFO Trees [0] -1/-1/-1->31->30 [1] -1/-1/-1->31->30 comm 0x2b3208000ab0 nRanks 96 busId 63000 e08r2n16:13446:14609 [3] NCCL INFO Trees [0] -1/-1/-1->35->34 [1] -1/-1/-1->35->34 comm 0x2abfb8000ab0 nRanks 96 busId 63000 e08r2n17:21284:22443 [3] NCCL INFO Trees [0] -1/-1/-1->39->38 [1] -1/-1/-1->39->38 comm 0x2ba520000ab0 nRanks 96 busId 63000 e08r3n11:29647:30751 [1] NCCL INFO Channel 01 : 93[26000] -> 94[43000] via P2P/IPC comm 0x2abd10000ab0 nRanks 96 e08r3n00:14535:15492 [2] NCCL INFO Trees [0] 51/-1/-1->50->49 [1] 51/-1/-1->50->49 comm 0x2baf68000ab0 nRanks 96 busId 43000 e08r3n03:22738:23847 [2] NCCL INFO Trees [0] 63/-1/-1->62->61 [1] 63/-1/-1->62->61 comm 0x2af43c000ab0 nRanks 96 busId 43000 e08r2n16:13444:14576 [1] NCCL INFO Trees [0] 34/16/-1->33->32 [1] 34/-1/-1->33->32 comm 0x2b0180000ab0 nRanks 96 busId 26000 e08r2n17:21280:22441 [0] NCCL INFO Trees [0] 37/-1/-1->36->41 [1] 37/32/-1->36->44 comm 0x2aff88000ab0 nRanks 96 busId 4000 e08r3n11:29648:30753 [2] NCCL INFO Channel 01 : 94[43000] -> 95[63000] via P2P/IPC comm 0x2b8da8000ab0 nRanks 96 e08r3n00:14536:15487 [3] NCCL INFO Trees [0] -1/-1/-1->51->50 [1] -1/-1/-1->51->50 comm 0x2b7774000ab0 nRanks 96 busId 63000 e08r3n03:22737:23845 [1] NCCL INFO Trees [0] 62/-1/-1->61->60 [1] 62/76/-1->61->60 comm 0x2ac6a0000ab0 nRanks 96 busId 26000 e08r2n19:9034:10156 [3] NCCL INFO Trees [0] -1/-1/-1->47->46 [1] -1/-1/-1->47->46 comm 0x2b6940000ab0 nRanks 96 busId 63000 e08r3n02:30405:31208 [3] NCCL INFO Trees [0] -1/-1/-1->59->58 [1] -1/-1/-1->59->58 comm 0x2b6924000ab0 nRanks 96 busId 63000 e08r3n01:6275:7256 [0] NCCL INFO Trees [0] 53/-1/-1->52->57 [1] 53/48/-1->52->45 comm 0x2b8738000ab0 nRanks 96 busId 4000 e08r2n09:27002:27953 [0] NCCL INFO Channel 00/0 : 3[63000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0d1c000ab0 nRanks 96 e08r2n08:5140:6524 [1] NCCL INFO Channel 01 : 1[26000] -> 2[43000] via P2P/IPC comm 0x2b30cc000ab0 nRanks 96 e08r2n16:13445:14603 [2] NCCL INFO Trees [0] 35/-1/-1->34->33 [1] 35/-1/-1->34->33 comm 0x2b67e4000ab0 nRanks 96 busId 43000 e08r2n17:21283:22448 [2] NCCL INFO Trees [0] 39/-1/-1->38->37 [1] 39/-1/-1->38->37 comm 0x2b9724000ab0 nRanks 96 busId 43000 e08r3n00:14534:15491 [1] NCCL INFO Trees [0] 50/40/-1->49->48 [1] 50/-1/-1->49->48 comm 0x2b8bd0000ab0 nRanks 96 busId 26000 e08r3n03:22735:23820 [0] NCCL INFO Trees [0] 61/-1/-1->60->56 [1] 61/44/-1->60->29 comm 0x2b4504000ab0 nRanks 96 busId 4000 e08r2n19:9033:10155 [2] NCCL INFO Trees [0] 47/-1/-1->46->45 [1] 47/-1/-1->46->45 comm 0x2b03ac000ab0 nRanks 96 busId 43000 e08r3n02:30404:31213 [2] NCCL INFO Trees [0] 59/-1/-1->58->57 [1] 59/-1/-1->58->57 comm 0x2b67ac000ab0 nRanks 96 busId 43000 e08r3n01:6278:7261 [2] NCCL INFO Trees [0] 55/-1/-1->54->53 [1] 55/-1/-1->54->53 comm 0x2b101c000ab0 nRanks 96 busId 43000 e08r2n09:27004:27956 [1] NCCL INFO Channel 00 : 5[26000] -> 6[43000] via P2P/IPC comm 0x2af6e0000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Channel 00/0 : 7[63000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b6040000ab0 nRanks 96 e08r2n18:755:1882 [3] NCCL INFO Trees [0] -1/-1/-1->43->42 [1] -1/-1/-1->43->42 comm 0x2b7fac000ab0 nRanks 96 busId 63000 e08r2n08:5141:6541 [2] NCCL INFO Channel 01 : 2[43000] -> 3[63000] via P2P/IPC comm 0x2b5bd8000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Trees [0] 49/56/-1->48->32 [1] 49/-1/-1->48->52 comm 0x2abe48000ab0 nRanks 96 busId 4000 e08r2n19:9032:10150 [1] NCCL INFO Trees [0] 46/-1/-1->45->44 [1] 46/52/-1->45->44 comm 0x2af5f8000ab0 nRanks 96 busId 26000 e08r3n02:30401:31205 [0] NCCL INFO Trees [0] 57/60/-1->56->48 [1] 57/-1/-1->56->53 comm 0x2bab5c000ab0 nRanks 96 busId 4000 e08r3n01:6279:7255 [3] NCCL INFO Trees [0] -1/-1/-1->55->54 [1] -1/-1/-1->55->54 comm 0x2aea58000ab0 nRanks 96 busId 63000 e08r2n09:27005:27965 [2] NCCL INFO Channel 00 : 6[43000] -> 7[63000] via P2P/IPC comm 0x2b3e48000ab0 nRanks 96 e08r2n10:875:1919 [2] NCCL INFO Channel 00 : 10[43000] -> 11[63000] via P2P/IPC comm 0x2af8c4000ab0 nRanks 96 e08r2n18:754:1880 [2] NCCL INFO Trees [0] 43/-1/-1->42->41 [1] 43/-1/-1->42->41 comm 0x2b2a28000ab0 nRanks 96 busId 43000 e08r2n11:5730:6763 [0] NCCL INFO Channel 00/0 : 11[63000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7a5c000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Trees [0] 45/-1/-1->44->40 [1] 45/36/-1->44->60 comm 0x2ab408000ab0 nRanks 96 busId 4000 e08r3n02:30403:31209 [1] NCCL INFO Trees [0] 58/52/-1->57->56 [1] 58/-1/-1->57->56 comm 0x2ba198000ab0 nRanks 96 busId 26000 e08r3n01:6277:7260 [1] NCCL INFO Trees [0] 54/-1/-1->53->52 [1] 54/56/-1->53->52 comm 0x2ba34c000ab0 nRanks 96 busId 26000 e08r2n09:27004:27956 [1] NCCL INFO Channel 01 : 5[26000] -> 6[43000] via P2P/IPC comm 0x2af6e0000ab0 nRanks 96 e08r2n10:874:1920 [1] NCCL INFO Channel 00 : 9[26000] -> 10[43000] via P2P/IPC comm 0x2b1f10000ab0 nRanks 96 e08r2n18:753:1883 [1] NCCL INFO Trees [0] 42/36/-1->41->40 [1] 42/-1/-1->41->40 comm 0x2b30f4000ab0 nRanks 96 busId 26000 e08r2n11:5733:6773 [2] NCCL INFO Channel 00 : 14[43000] -> 15[63000] via P2P/IPC comm 0x2ae6f0000ab0 nRanks 96 e08r2n09:27005:27965 [2] NCCL INFO Channel 01 : 6[43000] -> 7[63000] via P2P/IPC comm 0x2b3e48000ab0 nRanks 96 e08r2n10:874:1920 [1] NCCL INFO Channel 01 : 9[26000] -> 10[43000] via P2P/IPC comm 0x2b1f10000ab0 nRanks 96 e08r2n18:751:1877 [0] NCCL INFO Trees [0] 41/44/-1->40->49 [1] 41/-1/-1->40->37 comm 0x2b8134000ab0 nRanks 96 busId 4000 e08r2n11:5732:6769 [1] NCCL INFO Channel 00 : 13[26000] -> 14[43000] via P2P/IPC comm 0x2b11a0000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 00/0 : 15[63000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b66f4000ab0 nRanks 96 e08r2n10:875:1919 [2] NCCL INFO Channel 01 : 10[43000] -> 11[63000] via P2P/IPC comm 0x2af8c4000ab0 nRanks 96 e08r2n11:5733:6773 [2] NCCL INFO Channel 01 : 14[43000] -> 15[63000] via P2P/IPC comm 0x2ae6f0000ab0 nRanks 96 e08r2n12:8673:9656 [1] NCCL INFO Channel 00 : 17[26000] -> 18[43000] via P2P/IPC comm 0x2b92b8000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 00/0 : 19[63000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b5014000ab0 nRanks 96 e08r2n12:8674:9663 [2] NCCL INFO Channel 00 : 18[43000] -> 19[63000] via P2P/IPC comm 0x2b65a0000ab0 nRanks 96 e08r2n11:5732:6769 [1] NCCL INFO Channel 01 : 13[26000] -> 14[43000] via P2P/IPC comm 0x2b11a0000ab0 nRanks 96 e08r2n12:8673:9656 [1] NCCL INFO Channel 01 : 17[26000] -> 18[43000] via P2P/IPC comm 0x2b92b8000ab0 nRanks 96 e08r2n12:8674:9663 [2] NCCL INFO Channel 01 : 18[43000] -> 19[63000] via P2P/IPC comm 0x2b65a0000ab0 nRanks 96 e08r2n13:23993:25161 [1] NCCL INFO Channel 00 : 21[26000] -> 22[43000] via P2P/IPC comm 0x2b4058000ab0 nRanks 96 e08r2n13:23994:25164 [2] NCCL INFO Channel 00 : 22[43000] -> 23[63000] via P2P/IPC comm 0x2b5d8c000ab0 nRanks 96 e08r2n13:23993:25161 [1] NCCL INFO Channel 01 : 21[26000] -> 22[43000] via P2P/IPC comm 0x2b4058000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 00/0 : 27[63000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5d18000ab0 nRanks 96 e08r2n13:23994:25164 [2] NCCL INFO Channel 01 : 22[43000] -> 23[63000] via P2P/IPC comm 0x2b5d8c000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Channel 00/0 : 35[63000] -> 36[4000] [receive] via NET/IB/0 comm 0x2aff88000ab0 nRanks 96 e08r2n14:18192:19156 [0] NCCL INFO Channel 00/0 : 23[63000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b88b4000ab0 nRanks 96 e08r2n16:13442:14572 [0] NCCL INFO Channel 00/0 : 31[63000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4aa4000ab0 nRanks 96 e08r2n15:22023:23011 [1] NCCL INFO Channel 00 : 29[26000] -> 30[43000] via P2P/IPC comm 0x2ad4b8000ab0 nRanks 96 e08r2n14:18194:19155 [1] NCCL INFO Channel 00 : 25[26000] -> 26[43000] via P2P/IPC comm 0x2b43b4000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 00/0 : 51[63000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b8738000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 00/0 : 59[63000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4504000ab0 nRanks 96 e08r3n03:22738:23847 [2] NCCL INFO Channel 00 : 62[43000] -> 63[63000] via P2P/IPC comm 0x2af43c000ab0 nRanks 96 e08r2n14:18195:19161 [2] NCCL INFO Channel 00 : 26[43000] -> 27[63000] via P2P/IPC comm 0x2b74c4000ab0 nRanks 96 e08r3n03:22737:23845 [1] NCCL INFO Channel 00 : 61[26000] -> 62[43000] via P2P/IPC comm 0x2ac6a0000ab0 nRanks 96 e08r2n16:13445:14603 [2] NCCL INFO Channel 00 : 34[43000] -> 35[63000] via P2P/IPC comm 0x2b67e4000ab0 nRanks 96 e08r2n17:21282:22447 [1] NCCL INFO Channel 00 : 37[26000] -> 38[43000] via P2P/IPC comm 0x2abf00000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Channel 00/0 : 43[63000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab408000ab0 nRanks 96 e08r2n17:21283:22448 [2] NCCL INFO Channel 00 : 38[43000] -> 39[63000] via P2P/IPC comm 0x2b9724000ab0 nRanks 96 e08r2n19:9033:10155 [2] NCCL INFO Channel 00 : 46[43000] -> 47[63000] via P2P/IPC comm 0x2b03ac000ab0 nRanks 96 e08r2n15:22024:23016 [2] NCCL INFO Channel 00 : 30[43000] -> 31[63000] via P2P/IPC comm 0x2b123c000ab0 nRanks 96 e08r2n16:13444:14576 [1] NCCL INFO Channel 00 : 33[26000] -> 34[43000] via P2P/IPC comm 0x2b0180000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Channel 00/0 : 47[63000] -> 48[4000] [receive] via NET/IB/0 comm 0x2abe48000ab0 nRanks 96 e08r3n00:14535:15492 [2] NCCL INFO Channel 00 : 50[43000] -> 51[63000] via P2P/IPC comm 0x2baf68000ab0 nRanks 96 e08r3n03:22738:23847 [2] NCCL INFO Channel 01 : 62[43000] -> 63[63000] via P2P/IPC comm 0x2af43c000ab0 nRanks 96 e08r2n18:751:1877 [0] NCCL INFO Channel 00/0 : 39[63000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8134000ab0 nRanks 96 e08r3n01:6278:7261 [2] NCCL INFO Channel 00 : 54[43000] -> 55[63000] via P2P/IPC comm 0x2b101c000ab0 nRanks 96 e08r2n15:22023:23011 [1] NCCL INFO Channel 01 : 29[26000] -> 30[43000] via P2P/IPC comm 0x2ad4b8000ab0 nRanks 96 e08r2n14:18194:19155 [1] NCCL INFO Channel 01 : 25[26000] -> 26[43000] via P2P/IPC comm 0x2b43b4000ab0 nRanks 96 e08r2n14:18195:19161 [2] NCCL INFO Channel 01 : 26[43000] -> 27[63000] via P2P/IPC comm 0x2b74c4000ab0 nRanks 96 e08r2n19:9033:10155 [2] NCCL INFO Channel 01 : 46[43000] -> 47[63000] via P2P/IPC comm 0x2b03ac000ab0 nRanks 96 e08r3n02:30401:31205 [0] NCCL INFO Channel 00/0 : 55[63000] -> 56[4000] [receive] via NET/IB/0 comm 0x2bab5c000ab0 nRanks 96 e08r2n19:9032:10150 [1] NCCL INFO Channel 00 : 45[26000] -> 46[43000] via P2P/IPC comm 0x2af5f8000ab0 nRanks 96 e08r2n17:21282:22447 [1] NCCL INFO Channel 01 : 37[26000] -> 38[43000] via P2P/IPC comm 0x2abf00000ab0 nRanks 96 e08r3n01:6277:7260 [1] NCCL INFO Channel 00 : 53[26000] -> 54[43000] via P2P/IPC comm 0x2ba34c000ab0 nRanks 96 e08r3n00:14534:15491 [1] NCCL INFO Channel 00 : 49[26000] -> 50[43000] via P2P/IPC comm 0x2b8bd0000ab0 nRanks 96 e08r2n18:754:1880 [2] NCCL INFO Channel 00 : 42[43000] -> 43[63000] via P2P/IPC comm 0x2b2a28000ab0 nRanks 96 e08r2n17:21283:22448 [2] NCCL INFO Channel 01 : 38[43000] -> 39[63000] via P2P/IPC comm 0x2b9724000ab0 nRanks 96 e08r2n16:13444:14576 [1] NCCL INFO Channel 01 : 33[26000] -> 34[43000] via P2P/IPC comm 0x2b0180000ab0 nRanks 96 e08r3n03:22737:23845 [1] NCCL INFO Channel 01 : 61[26000] -> 62[43000] via P2P/IPC comm 0x2ac6a0000ab0 nRanks 96 e08r2n16:13445:14603 [2] NCCL INFO Channel 01 : 34[43000] -> 35[63000] via P2P/IPC comm 0x2b67e4000ab0 nRanks 96 e08r3n01:6278:7261 [2] NCCL INFO Channel 01 : 54[43000] -> 55[63000] via P2P/IPC comm 0x2b101c000ab0 nRanks 96 e08r2n15:22024:23016 [2] NCCL INFO Channel 01 : 30[43000] -> 31[63000] via P2P/IPC comm 0x2b123c000ab0 nRanks 96 e08r3n00:14535:15492 [2] NCCL INFO Channel 01 : 50[43000] -> 51[63000] via P2P/IPC comm 0x2baf68000ab0 nRanks 96 e08r2n18:754:1880 [2] NCCL INFO Channel 01 : 42[43000] -> 43[63000] via P2P/IPC comm 0x2b2a28000ab0 nRanks 96 e08r2n18:753:1883 [1] NCCL INFO Channel 00 : 41[26000] -> 42[43000] via P2P/IPC comm 0x2b30f4000ab0 nRanks 96 e08r3n00:14534:15491 [1] NCCL INFO Channel 01 : 49[26000] -> 50[43000] via P2P/IPC comm 0x2b8bd0000ab0 nRanks 96 e08r2n19:9032:10150 [1] NCCL INFO Channel 01 : 45[26000] -> 46[43000] via P2P/IPC comm 0x2af5f8000ab0 nRanks 96 e08r3n01:6277:7260 [1] NCCL INFO Channel 01 : 53[26000] -> 54[43000] via P2P/IPC comm 0x2ba34c000ab0 nRanks 96 e08r2n18:753:1883 [1] NCCL INFO Channel 01 : 41[26000] -> 42[43000] via P2P/IPC comm 0x2b30f4000ab0 nRanks 96 e08r3n02:30403:31209 [1] NCCL INFO Channel 00 : 57[26000] -> 58[43000] via P2P/IPC comm 0x2ba198000ab0 nRanks 96 e08r3n02:30404:31213 [2] NCCL INFO Channel 00 : 58[43000] -> 59[63000] via P2P/IPC comm 0x2b67ac000ab0 nRanks 96 e08r3n02:30404:31213 [2] NCCL INFO Channel 01 : 58[43000] -> 59[63000] via P2P/IPC comm 0x2b67ac000ab0 nRanks 96 e08r3n02:30403:31209 [1] NCCL INFO Channel 01 : 57[26000] -> 58[43000] via P2P/IPC comm 0x2ba198000ab0 nRanks 96 e08r3n03:22739:23827 [3] NCCL INFO Channel 00/0 : 63[63000] -> 64[4000] [send] via NET/IB/0 comm 0x2b0524000ab0 nRanks 96 e08r3n08:13434:14586 [0] NCCL INFO Channel 01/0 : 79[63000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abcf4000ab0 nRanks 96 e08r3n08:13434:14586 [0] NCCL INFO Channel 00 : 80[4000] -> 81[26000] via P2P/IPC comm 0x2abcf4000ab0 nRanks 96 e08r3n08:13434:14586 [0] NCCL INFO Channel 01 : 80[4000] -> 81[26000] via P2P/IPC comm 0x2abcf4000ab0 nRanks 96 e08r3n04:16940:17743 [3] NCCL INFO Channel 00/0 : 67[63000] -> 68[4000] [send] via NET/IB/0 comm 0x2b1e28000ab0 nRanks 96 e08r3n04:16936:17745 [0] NCCL INFO Channel 01/0 : 63[63000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b3574000ab0 nRanks 96 e08r3n05:24735:25797 [3] NCCL INFO Channel 00/0 : 71[63000] -> 72[4000] [send] via NET/IB/0 comm 0x2ac218000ab0 nRanks 96 e08r3n07:4893:5961 [3] NCCL INFO Channel 00/0 : 79[63000] -> 80[4000] [send] via NET/IB/0 comm 0x2ba69c000ab0 nRanks 96 e08r3n04:16936:17745 [0] NCCL INFO Channel 00 : 64[4000] -> 65[26000] via P2P/IPC comm 0x2b3574000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO Channel 01/0 : 67[63000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b85d4000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO Channel 00 : 68[4000] -> 69[26000] via P2P/IPC comm 0x2b85d4000ab0 nRanks 96 e08r3n11:29649:30749 [3] NCCL INFO Channel 00/0 : 95[63000] -> 0[4000] [send] via NET/IB/0 comm 0x2ba6ec000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Channel 01/0 : 75[63000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aed78000ab0 nRanks 96 e08r3n09:8679:9728 [3] NCCL INFO Channel 00/0 : 87[63000] -> 88[4000] [send] via NET/IB/0 comm 0x2b0c4c000ab0 nRanks 96 e08r3n11:29645:30741 [0] NCCL INFO Channel 01/0 : 91[63000] -> 92[4000] [receive] via NET/IB/0 comm 0x2ac238000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Channel 00 : 76[4000] -> 77[26000] via P2P/IPC comm 0x2aed78000ab0 nRanks 96 e08r3n09:8675:9723 [0] NCCL INFO Channel 01/0 : 83[63000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b416c000ab0 nRanks 96 e08r3n06:22285:23335 [3] NCCL INFO Channel 00/0 : 75[63000] -> 76[4000] [send] via NET/IB/0 comm 0x2b91b4000ab0 nRanks 96 e08r3n11:29645:30741 [0] NCCL INFO Channel 00 : 92[4000] -> 93[26000] via P2P/IPC comm 0x2ac238000ab0 nRanks 96 e08r3n09:8675:9723 [0] NCCL INFO Channel 00 : 84[4000] -> 85[26000] via P2P/IPC comm 0x2b416c000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Channel 01/0 : 71[63000] -> 72[4000] [receive] via NET/IB/0 comm 0x2af9e0000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Channel 00 : 72[4000] -> 73[26000] via P2P/IPC comm 0x2af9e0000ab0 nRanks 96 e08r3n08:13438:14591 [3] NCCL INFO Channel 00/0 : 83[63000] -> 84[4000] [send] via NET/IB/0 comm 0x2b2614000ab0 nRanks 96 e08r3n04:16936:17745 [0] NCCL INFO Channel 01 : 64[4000] -> 65[26000] via P2P/IPC comm 0x2b3574000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO Channel 01 : 68[4000] -> 69[26000] via P2P/IPC comm 0x2b85d4000ab0 nRanks 96 e08r2n08:5142:6491 [3] NCCL INFO Channel 00/0 : 3[63000] -> 4[4000] [send] via NET/IB/0 comm 0x2ad4a8000ab0 nRanks 96 e08r3n10:18788:19808 [3] NCCL INFO Channel 00/0 : 91[63000] -> 92[4000] [send] via NET/IB/0 comm 0x2ad848000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 01/0 : 87[63000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af008000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Channel 01 : 76[4000] -> 77[26000] via P2P/IPC comm 0x2aed78000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 00 : 88[4000] -> 89[26000] via P2P/IPC comm 0x2af008000ab0 nRanks 96 e08r2n08:5136:6335 [0] NCCL INFO Channel 01/0 : 95[63000] -> 0[4000] [receive] via NET/IB/0 comm 0x2b2e44000ab0 nRanks 96 e08r2n08:5136:6335 [0] NCCL INFO Channel 00 : 0[4000] -> 1[26000] via P2P/IPC comm 0x2b2e44000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Channel 01 : 72[4000] -> 73[26000] via P2P/IPC comm 0x2af9e0000ab0 nRanks 96 e08r3n09:8675:9723 [0] NCCL INFO Channel 01 : 84[4000] -> 85[26000] via P2P/IPC comm 0x2b416c000ab0 nRanks 96 e08r3n11:29645:30741 [0] NCCL INFO Channel 01 : 92[4000] -> 93[26000] via P2P/IPC comm 0x2ac238000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Channel 01/0 : 7[63000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b6040000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Channel 00 : 8[4000] -> 9[26000] via P2P/IPC comm 0x2b6040000ab0 nRanks 96 e08r2n09:27002:27953 [0] NCCL INFO Channel 01/0 : 3[63000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0d1c000ab0 nRanks 96 e08r2n09:27002:27953 [0] NCCL INFO Channel 00 : 4[4000] -> 5[26000] via P2P/IPC comm 0x2b0d1c000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 01 : 88[4000] -> 89[26000] via P2P/IPC comm 0x2af008000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Channel 01 : 8[4000] -> 9[26000] via P2P/IPC comm 0x2b6040000ab0 nRanks 96 e08r2n08:5136:6335 [0] NCCL INFO Channel 01 : 0[4000] -> 1[26000] via P2P/IPC comm 0x2b2e44000ab0 nRanks 96 e08r2n09:27002:27953 [0] NCCL INFO Channel 01 : 4[4000] -> 5[26000] via P2P/IPC comm 0x2b0d1c000ab0 nRanks 96 e08r2n11:5734:6772 [3] NCCL INFO Channel 00/0 : 15[63000] -> 16[4000] [send] via NET/IB/0 comm 0x2b4144000ab0 nRanks 96 e08r2n11:5730:6763 [0] NCCL INFO Channel 01/0 : 11[63000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7a5c000ab0 nRanks 96 e08r2n11:5730:6763 [0] NCCL INFO Channel 00 : 12[4000] -> 13[26000] via P2P/IPC comm 0x2b7a5c000ab0 nRanks 96 e08r2n10:876:1918 [3] NCCL INFO Channel 00/0 : 11[63000] -> 12[4000] [send] via NET/IB/0 comm 0x2b2d0c000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 01/0 : 19[63000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b5014000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 00 : 20[4000] -> 21[26000] via P2P/IPC comm 0x2b5014000ab0 nRanks 96 e08r2n09:27006:27966 [3] NCCL INFO Channel 00/0 : 7[63000] -> 8[4000] [send] via NET/IB/0 comm 0x2b56e4000ab0 nRanks 96 e08r2n12:8675:9665 [3] NCCL INFO Channel 00/0 : 19[63000] -> 20[4000] [send] via NET/IB/0 comm 0x2b2e18000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 01/0 : 15[63000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b66f4000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 00 : 16[4000] -> 17[26000] via P2P/IPC comm 0x2b66f4000ab0 nRanks 96 e08r2n11:5730:6763 [0] NCCL INFO Channel 01 : 12[4000] -> 13[26000] via P2P/IPC comm 0x2b7a5c000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 01 : 20[4000] -> 21[26000] via P2P/IPC comm 0x2b5014000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 01 : 16[4000] -> 17[26000] via P2P/IPC comm 0x2b66f4000ab0 nRanks 96 e08r2n13:23995:25163 [3] NCCL INFO Channel 00/0 : 23[63000] -> 24[4000] [send] via NET/IB/0 comm 0x2b4b08000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 01/0 : 59[63000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4504000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 00 : 60[4000] -> 61[26000] via P2P/IPC comm 0x2b4504000ab0 nRanks 96 e08r3n08:13436:14594 [1] NCCL INFO Connected all rings comm 0x2b1954000ab0 nRanks 96 busId 26000 e08r2n16:13446:14609 [3] NCCL INFO Channel 00/0 : 35[63000] -> 36[4000] [send] via NET/IB/0 comm 0x2abfb8000ab0 nRanks 96 e08r3n02:30401:31205 [0] NCCL INFO Channel 01/0 : 55[63000] -> 56[4000] [receive] via NET/IB/0 comm 0x2bab5c000ab0 nRanks 96 e08r2n16:13442:14572 [0] NCCL INFO Channel 01/0 : 31[63000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4aa4000ab0 nRanks 96 e08r2n16:13442:14572 [0] NCCL INFO Channel 00 : 32[4000] -> 33[26000] via P2P/IPC comm 0x2b4aa4000ab0 nRanks 96 e08r3n02:30401:31205 [0] NCCL INFO Channel 00 : 56[4000] -> 57[26000] via P2P/IPC comm 0x2bab5c000ab0 nRanks 96 e08r3n09:8677:9721 [1] NCCL INFO Connected all rings comm 0x2b4344000ab0 nRanks 96 busId 26000 e08r2n15:22025:23017 [3] NCCL INFO Channel 00/0 : 31[63000] -> 32[4000] [send] via NET/IB/0 comm 0x2b3208000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 01/0 : 27[63000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5d18000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 00 : 28[4000] -> 29[26000] via P2P/IPC comm 0x2b5d18000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 01 : 60[4000] -> 61[26000] via P2P/IPC comm 0x2b4504000ab0 nRanks 96 e08r3n11:29647:30751 [1] NCCL INFO Connected all rings comm 0x2abd10000ab0 nRanks 96 busId 26000 e08r3n08:13436:14594 [1] NCCL INFO Channel 00/0 : 72[4000] -> 81[26000] [receive] via NET/IB/0 comm 0x2b1954000ab0 nRanks 96 e08r2n17:21284:22443 [3] NCCL INFO Channel 00/0 : 39[63000] -> 40[4000] [send] via NET/IB/0 comm 0x2ba520000ab0 nRanks 96 e08r3n05:24733:25802 [1] NCCL INFO Connected all rings comm 0x2ab9d4000ab0 nRanks 96 busId 26000 e08r2n14:18196:19160 [3] NCCL INFO Channel 00/0 : 27[63000] -> 28[4000] [send] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Channel 01/0 : 35[63000] -> 36[4000] [receive] via NET/IB/0 comm 0x2aff88000ab0 nRanks 96 e08r3n02:30401:31205 [0] NCCL INFO Channel 01 : 56[4000] -> 57[26000] via P2P/IPC comm 0x2bab5c000ab0 nRanks 96 e08r3n07:4891:5944 [1] NCCL INFO Connected all rings comm 0x2b7a94000ab0 nRanks 96 busId 26000 e08r2n14:18192:19156 [0] NCCL INFO Channel 01/0 : 23[63000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b88b4000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Channel 00 : 36[4000] -> 37[26000] via P2P/IPC comm 0x2aff88000ab0 nRanks 96 e08r3n10:18786:19830 [1] NCCL INFO Connected all rings comm 0x2ac35c000ab0 nRanks 96 busId 26000 e08r2n16:13442:14572 [0] NCCL INFO Channel 01 : 32[4000] -> 33[26000] via P2P/IPC comm 0x2b4aa4000ab0 nRanks 96 e08r2n18:755:1882 [3] NCCL INFO Channel 00/0 : 43[63000] -> 44[4000] [send] via NET/IB/0 comm 0x2b7fac000ab0 nRanks 96 e08r3n01:6279:7255 [3] NCCL INFO Channel 00/0 : 55[63000] -> 56[4000] [send] via NET/IB/0 comm 0x2aea58000ab0 nRanks 96 e08r3n04:16938:17748 [1] NCCL INFO Connected all rings comm 0x2b0b78000ab0 nRanks 96 busId 26000 e08r2n14:18192:19156 [0] NCCL INFO Channel 00 : 24[4000] -> 25[26000] via P2P/IPC comm 0x2b88b4000ab0 nRanks 96 e08r2n18:751:1877 [0] NCCL INFO Channel 01/0 : 39[63000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8134000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 01/0 : 51[63000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b8738000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 00 : 52[4000] -> 53[26000] via P2P/IPC comm 0x2b8738000ab0 nRanks 96 e08r2n19:9034:10156 [3] NCCL INFO Channel 00/0 : 47[63000] -> 48[4000] [send] via NET/IB/0 comm 0x2b6940000ab0 nRanks 96 e08r3n09:8677:9721 [1] NCCL INFO Channel 01/0 : 85[26000] -> 88[4000] [send] via NET/IB/0 comm 0x2b4344000ab0 nRanks 96 e08r3n00:14536:15487 [3] NCCL INFO Channel 00/0 : 51[63000] -> 52[4000] [send] via NET/IB/0 comm 0x2b7774000ab0 nRanks 96 e08r3n06:22283:23339 [1] NCCL INFO Connected all rings comm 0x2b9a88000ab0 nRanks 96 busId 26000 e08r2n18:751:1877 [0] NCCL INFO Channel 00 : 40[4000] -> 41[26000] via P2P/IPC comm 0x2b8134000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Channel 01/0 : 43[63000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab408000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Channel 01/0 : 47[63000] -> 48[4000] [receive] via NET/IB/0 comm 0x2abe48000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 01 : 28[4000] -> 29[26000] via P2P/IPC comm 0x2b5d18000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Channel 00 : 44[4000] -> 45[26000] via P2P/IPC comm 0x2ab408000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Channel 00 : 48[4000] -> 49[26000] via P2P/IPC comm 0x2abe48000ab0 nRanks 96 e08r3n05:24733:25802 [1] NCCL INFO Channel 01/0 : 69[26000] -> 72[4000] [send] via NET/IB/0 comm 0x2ab9d4000ab0 nRanks 96 e08r3n07:4891:5944 [1] NCCL INFO Channel 01/0 : 77[26000] -> 84[4000] [send] via NET/IB/0 comm 0x2b7a94000ab0 nRanks 96 e08r2n09:27004:27956 [1] NCCL INFO Connected all rings comm 0x2af6e0000ab0 nRanks 96 busId 26000 e08r2n18:751:1877 [0] NCCL INFO Channel 01 : 40[4000] -> 41[26000] via P2P/IPC comm 0x2b8134000ab0 nRanks 96 e08r2n14:18192:19156 [0] NCCL INFO Channel 01 : 24[4000] -> 25[26000] via P2P/IPC comm 0x2b88b4000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 01 : 52[4000] -> 53[26000] via P2P/IPC comm 0x2b8738000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Channel 01 : 36[4000] -> 37[26000] via P2P/IPC comm 0x2aff88000ab0 nRanks 96 e08r3n02:30405:31208 [3] NCCL INFO Channel 00/0 : 59[63000] -> 60[4000] [send] via NET/IB/0 comm 0x2b6924000ab0 nRanks 96 e08r3n11:29647:30751 [1] NCCL INFO Channel 00 : 93[26000] -> 92[4000] via P2P/IPC comm 0x2abd10000ab0 nRanks 96 e08r2n08:5140:6524 [1] NCCL INFO Connected all rings comm 0x2b30cc000ab0 nRanks 96 busId 26000 e08r2n10:874:1920 [1] NCCL INFO Connected all rings comm 0x2b1f10000ab0 nRanks 96 busId 26000 e08r2n19:9030:10143 [0] NCCL INFO Channel 01 : 44[4000] -> 45[26000] via P2P/IPC comm 0x2ab408000ab0 nRanks 96 e08r3n10:18786:19830 [1] NCCL INFO Channel 00/0 : 84[4000] -> 89[26000] [receive] via NET/IB/0 comm 0x2ac35c000ab0 nRanks 96 e08r3n04:16938:17748 [1] NCCL INFO Channel 00/0 : 32[4000] -> 65[26000] [receive] via NET/IB/0 comm 0x2b0b78000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Channel 01 : 48[4000] -> 49[26000] via P2P/IPC comm 0x2abe48000ab0 nRanks 96 e08r3n11:29647:30751 [1] NCCL INFO Channel 01 : 93[26000] -> 92[4000] via P2P/IPC comm 0x2abd10000ab0 nRanks 96 e08r3n06:22283:23339 [1] NCCL INFO Channel 00/0 : 68[4000] -> 73[26000] [receive] via NET/IB/0 comm 0x2b9a88000ab0 nRanks 96 e08r2n09:27004:27956 [1] NCCL INFO Channel 01/0 : 5[26000] -> 8[4000] [send] via NET/IB/0 comm 0x2af6e0000ab0 nRanks 96 e08r2n10:874:1920 [1] NCCL INFO Channel 00/0 : 4[4000] -> 9[26000] [receive] via NET/IB/0 comm 0x2b1f10000ab0 nRanks 96 e08r2n08:5140:6524 [1] NCCL INFO Channel 00 : 1[26000] -> 0[4000] via P2P/IPC comm 0x2b30cc000ab0 nRanks 96 e08r2n08:5140:6524 [1] NCCL INFO Channel 01 : 1[26000] -> 0[4000] via P2P/IPC comm 0x2b30cc000ab0 nRanks 96 e08r2n11:5732:6769 [1] NCCL INFO Connected all rings comm 0x2b11a0000ab0 nRanks 96 busId 26000 e08r2n13:23993:25161 [1] NCCL INFO Connected all rings comm 0x2b4058000ab0 nRanks 96 busId 26000 e08r2n12:8673:9656 [1] NCCL INFO Connected all rings comm 0x2b92b8000ab0 nRanks 96 busId 26000 e08r2n11:5732:6769 [1] NCCL INFO Channel 01/0 : 13[26000] -> 20[4000] [send] via NET/IB/0 comm 0x2b11a0000ab0 nRanks 96 e08r2n13:23993:25161 [1] NCCL INFO Channel 01/0 : 21[26000] -> 24[4000] [send] via NET/IB/0 comm 0x2b4058000ab0 nRanks 96 e08r2n12:8673:9656 [1] NCCL INFO Channel 00/0 : 8[4000] -> 17[26000] [receive] via NET/IB/0 comm 0x2b92b8000ab0 nRanks 96 e08r3n03:22737:23845 [1] NCCL INFO Connected all rings comm 0x2ac6a0000ab0 nRanks 96 busId 26000 e08r3n02:30403:31209 [1] NCCL INFO Connected all rings comm 0x2ba198000ab0 nRanks 96 busId 26000 e08r2n16:13444:14576 [1] NCCL INFO Connected all rings comm 0x2b0180000ab0 nRanks 96 busId 26000 e08r3n01:6277:7260 [1] NCCL INFO Connected all rings comm 0x2ba34c000ab0 nRanks 96 busId 26000 e08r2n15:22023:23011 [1] NCCL INFO Connected all rings comm 0x2ad4b8000ab0 nRanks 96 busId 26000 e08r3n03:22737:23845 [1] NCCL INFO Channel 01/0 : 61[26000] -> 76[4000] [send] via NET/IB/0 comm 0x2ac6a0000ab0 nRanks 96 e08r2n14:18194:19155 [1] NCCL INFO Connected all rings comm 0x2b43b4000ab0 nRanks 96 busId 26000 e08r2n18:753:1883 [1] NCCL INFO Connected all rings comm 0x2b30f4000ab0 nRanks 96 busId 26000 e08r3n02:30403:31209 [1] NCCL INFO Channel 00/0 : 52[4000] -> 57[26000] [receive] via NET/IB/0 comm 0x2ba198000ab0 nRanks 96 e08r2n17:21282:22447 [1] NCCL INFO Connected all rings comm 0x2abf00000ab0 nRanks 96 busId 26000 e08r3n01:6277:7260 [1] NCCL INFO Channel 01/0 : 53[26000] -> 56[4000] [send] via NET/IB/0 comm 0x2ba34c000ab0 nRanks 96 e08r2n19:9032:10150 [1] NCCL INFO Connected all rings comm 0x2af5f8000ab0 nRanks 96 busId 26000 e08r2n16:13444:14576 [1] NCCL INFO Channel 00/0 : 16[4000] -> 33[26000] [receive] via NET/IB/0 comm 0x2b0180000ab0 nRanks 96 e08r2n15:22023:23011 [1] NCCL INFO Channel 01/0 : 29[26000] -> 60[4000] [send] via NET/IB/0 comm 0x2ad4b8000ab0 nRanks 96 e08r3n00:14534:15491 [1] NCCL INFO Connected all rings comm 0x2b8bd0000ab0 nRanks 96 busId 26000 e08r2n17:21282:22447 [1] NCCL INFO Channel 01/0 : 37[26000] -> 40[4000] [send] via NET/IB/0 comm 0x2abf00000ab0 nRanks 96 e08r2n14:18194:19155 [1] NCCL INFO Channel 00/0 : 20[4000] -> 25[26000] [receive] via NET/IB/0 comm 0x2b43b4000ab0 nRanks 96 e08r2n18:753:1883 [1] NCCL INFO Channel 00/0 : 36[4000] -> 41[26000] [receive] via NET/IB/0 comm 0x2b30f4000ab0 nRanks 96 e08r2n19:9032:10150 [1] NCCL INFO Channel 01/0 : 45[26000] -> 52[4000] [send] via NET/IB/0 comm 0x2af5f8000ab0 nRanks 96 e08r3n00:14534:15491 [1] NCCL INFO Channel 00/0 : 40[4000] -> 49[26000] [receive] via NET/IB/0 comm 0x2b8bd0000ab0 nRanks 96 e08r3n03:22739:23827 [3] NCCL INFO Channel 01/0 : 63[63000] -> 64[4000] [send] via NET/IB/0 comm 0x2b0524000ab0 nRanks 96 e08r3n04:16940:17743 [3] NCCL INFO Channel 01/0 : 67[63000] -> 68[4000] [send] via NET/IB/0 comm 0x2b1e28000ab0 nRanks 96 e08r3n05:24735:25797 [3] NCCL INFO Channel 01/0 : 71[63000] -> 72[4000] [send] via NET/IB/0 comm 0x2ac218000ab0 nRanks 96 e08r3n07:4893:5961 [3] NCCL INFO Channel 01/0 : 79[63000] -> 80[4000] [send] via NET/IB/0 comm 0x2ba69c000ab0 nRanks 96 e08r3n09:8679:9728 [3] NCCL INFO Channel 01/0 : 87[63000] -> 88[4000] [send] via NET/IB/0 comm 0x2b0c4c000ab0 nRanks 96 e08r3n11:29649:30749 [3] NCCL INFO Channel 01/0 : 95[63000] -> 0[4000] [send] via NET/IB/0 comm 0x2ba6ec000ab0 nRanks 96 e08r3n06:22285:23335 [3] NCCL INFO Channel 01/0 : 75[63000] -> 76[4000] [send] via NET/IB/0 comm 0x2b91b4000ab0 nRanks 96 e08r3n08:13438:14591 [3] NCCL INFO Channel 01/0 : 83[63000] -> 84[4000] [send] via NET/IB/0 comm 0x2b2614000ab0 nRanks 96 e08r2n08:5142:6491 [3] NCCL INFO Channel 01/0 : 3[63000] -> 4[4000] [send] via NET/IB/0 comm 0x2ad4a8000ab0 nRanks 96 e08r3n10:18788:19808 [3] NCCL INFO Channel 01/0 : 91[63000] -> 92[4000] [send] via NET/IB/0 comm 0x2ad848000ab0 nRanks 96 e08r3n03:22738:23847 [2] NCCL INFO Connected all rings comm 0x2af43c000ab0 nRanks 96 busId 43000 e08r2n11:5734:6772 [3] NCCL INFO Channel 01/0 : 15[63000] -> 16[4000] [send] via NET/IB/0 comm 0x2b4144000ab0 nRanks 96 e08r2n10:876:1918 [3] NCCL INFO Channel 01/0 : 11[63000] -> 12[4000] [send] via NET/IB/0 comm 0x2b2d0c000ab0 nRanks 96 e08r2n09:27006:27966 [3] NCCL INFO Channel 01/0 : 7[63000] -> 8[4000] [send] via NET/IB/0 comm 0x2b56e4000ab0 nRanks 96 e08r3n03:22738:23847 [2] NCCL INFO Channel 00 : 62[43000] -> 61[26000] via P2P/IPC comm 0x2af43c000ab0 nRanks 96 e08r2n12:8675:9665 [3] NCCL INFO Channel 01/0 : 19[63000] -> 20[4000] [send] via NET/IB/0 comm 0x2b2e18000ab0 nRanks 96 e08r3n03:22738:23847 [2] NCCL INFO Channel 01 : 62[43000] -> 61[26000] via P2P/IPC comm 0x2af43c000ab0 nRanks 96 e08r3n11:29648:30753 [2] NCCL INFO Connected all rings comm 0x2b8da8000ab0 nRanks 96 busId 43000 e08r3n04:16939:17749 [2] NCCL INFO Connected all rings comm 0x2b4eb4000ab0 nRanks 96 busId 43000 e08r3n07:4892:5963 [2] NCCL INFO Connected all rings comm 0x2b9670000ab0 nRanks 96 busId 43000 e08r3n05:24734:25804 [2] NCCL INFO Connected all rings comm 0x2b26b0000ab0 nRanks 96 busId 43000 e08r3n09:8678:9738 [2] NCCL INFO Connected all rings comm 0x2b20f8000ab0 nRanks 96 busId 43000 e08r3n10:18787:19820 [2] NCCL INFO Connected all rings comm 0x2ae6c4000ab0 nRanks 96 busId 43000 e08r3n06:22284:23338 [2] NCCL INFO Connected all rings comm 0x2b141c000ab0 nRanks 96 busId 43000 e08r2n13:23995:25163 [3] NCCL INFO Channel 01/0 : 23[63000] -> 24[4000] [send] via NET/IB/0 comm 0x2b4b08000ab0 nRanks 96 e08r3n11:29648:30753 [2] NCCL INFO Channel 00 : 94[43000] -> 93[26000] via P2P/IPC comm 0x2b8da8000ab0 nRanks 96 e08r2n16:13446:14609 [3] NCCL INFO Channel 01/0 : 35[63000] -> 36[4000] [send] via NET/IB/0 comm 0x2abfb8000ab0 nRanks 96 e08r3n05:24734:25804 [2] NCCL INFO Channel 00 : 70[43000] -> 69[26000] via P2P/IPC comm 0x2b26b0000ab0 nRanks 96 e08r2n08:5141:6541 [2] NCCL INFO Connected all rings comm 0x2b5bd8000ab0 nRanks 96 busId 43000 e08r3n07:4892:5963 [2] NCCL INFO Channel 00 : 78[43000] -> 77[26000] via P2P/IPC comm 0x2b9670000ab0 nRanks 96 e08r3n11:29648:30753 [2] NCCL INFO Channel 01 : 94[43000] -> 93[26000] via P2P/IPC comm 0x2b8da8000ab0 nRanks 96 e08r3n08:13437:14595 [2] NCCL INFO Connected all rings comm 0x2b8f38000ab0 nRanks 96 busId 43000 e08r2n15:22025:23017 [3] NCCL INFO Channel 01/0 : 31[63000] -> 32[4000] [send] via NET/IB/0 comm 0x2b3208000ab0 nRanks 96 e08r3n04:16939:17749 [2] NCCL INFO Channel 00 : 66[43000] -> 65[26000] via P2P/IPC comm 0x2b4eb4000ab0 nRanks 96 e08r3n06:22284:23338 [2] NCCL INFO Channel 00 : 74[43000] -> 73[26000] via P2P/IPC comm 0x2b141c000ab0 nRanks 96 e08r2n14:18196:19160 [3] NCCL INFO Channel 01/0 : 27[63000] -> 28[4000] [send] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r3n09:8678:9738 [2] NCCL INFO Channel 00 : 86[43000] -> 85[26000] via P2P/IPC comm 0x2b20f8000ab0 nRanks 96 e08r3n10:18787:19820 [2] NCCL INFO Channel 00 : 90[43000] -> 89[26000] via P2P/IPC comm 0x2ae6c4000ab0 nRanks 96 e08r3n07:4892:5963 [2] NCCL INFO Channel 01 : 78[43000] -> 77[26000] via P2P/IPC comm 0x2b9670000ab0 nRanks 96 e08r2n17:21284:22443 [3] NCCL INFO Channel 01/0 : 39[63000] -> 40[4000] [send] via NET/IB/0 comm 0x2ba520000ab0 nRanks 96 e08r3n04:16939:17749 [2] NCCL INFO Channel 01 : 66[43000] -> 65[26000] via P2P/IPC comm 0x2b4eb4000ab0 nRanks 96 e08r3n05:24734:25804 [2] NCCL INFO Channel 01 : 70[43000] -> 69[26000] via P2P/IPC comm 0x2b26b0000ab0 nRanks 96 e08r2n18:755:1882 [3] NCCL INFO Channel 01/0 : 43[63000] -> 44[4000] [send] via NET/IB/0 comm 0x2b7fac000ab0 nRanks 96 e08r3n01:6279:7255 [3] NCCL INFO Channel 01/0 : 55[63000] -> 56[4000] [send] via NET/IB/0 comm 0x2aea58000ab0 nRanks 96 e08r2n19:9034:10156 [3] NCCL INFO Channel 01/0 : 47[63000] -> 48[4000] [send] via NET/IB/0 comm 0x2b6940000ab0 nRanks 96 e08r3n06:22284:23338 [2] NCCL INFO Channel 01 : 74[43000] -> 73[26000] via P2P/IPC comm 0x2b141c000ab0 nRanks 96 e08r3n09:8678:9738 [2] NCCL INFO Channel 01 : 86[43000] -> 85[26000] via P2P/IPC comm 0x2b20f8000ab0 nRanks 96 e08r3n00:14536:15487 [3] NCCL INFO Channel 01/0 : 51[63000] -> 52[4000] [send] via NET/IB/0 comm 0x2b7774000ab0 nRanks 96 e08r3n10:18787:19820 [2] NCCL INFO Channel 01 : 90[43000] -> 89[26000] via P2P/IPC comm 0x2ae6c4000ab0 nRanks 96 e08r2n08:5141:6541 [2] NCCL INFO Channel 00 : 2[43000] -> 1[26000] via P2P/IPC comm 0x2b5bd8000ab0 nRanks 96 e08r3n08:13437:14595 [2] NCCL INFO Channel 00 : 82[43000] -> 81[26000] via P2P/IPC comm 0x2b8f38000ab0 nRanks 96 e08r2n12:8674:9663 [2] NCCL INFO Connected all rings comm 0x2b65a0000ab0 nRanks 96 busId 43000 e08r3n02:30405:31208 [3] NCCL INFO Channel 01/0 : 59[63000] -> 60[4000] [send] via NET/IB/0 comm 0x2b6924000ab0 nRanks 96 e08r2n08:5141:6541 [2] NCCL INFO Channel 01 : 2[43000] -> 1[26000] via P2P/IPC comm 0x2b5bd8000ab0 nRanks 96 e08r3n08:13437:14595 [2] NCCL INFO Channel 01 : 82[43000] -> 81[26000] via P2P/IPC comm 0x2b8f38000ab0 nRanks 96 e08r2n11:5733:6773 [2] NCCL INFO Connected all rings comm 0x2ae6f0000ab0 nRanks 96 busId 43000 e08r2n10:875:1919 [2] NCCL INFO Connected all rings comm 0x2af8c4000ab0 nRanks 96 busId 43000 e08r2n09:27005:27965 [2] NCCL INFO Connected all rings comm 0x2b3e48000ab0 nRanks 96 busId 43000 e08r2n12:8674:9663 [2] NCCL INFO Channel 00 : 18[43000] -> 17[26000] via P2P/IPC comm 0x2b65a0000ab0 nRanks 96 e08r2n11:5733:6773 [2] NCCL INFO Channel 00 : 14[43000] -> 13[26000] via P2P/IPC comm 0x2ae6f0000ab0 nRanks 96 e08r2n10:875:1919 [2] NCCL INFO Channel 00 : 10[43000] -> 9[26000] via P2P/IPC comm 0x2af8c4000ab0 nRanks 96 e08r2n12:8674:9663 [2] NCCL INFO Channel 01 : 18[43000] -> 17[26000] via P2P/IPC comm 0x2b65a0000ab0 nRanks 96 e08r2n10:875:1919 [2] NCCL INFO Channel 01 : 10[43000] -> 9[26000] via P2P/IPC comm 0x2af8c4000ab0 nRanks 96 e08r2n11:5733:6773 [2] NCCL INFO Channel 01 : 14[43000] -> 13[26000] via P2P/IPC comm 0x2ae6f0000ab0 nRanks 96 e08r2n09:27005:27965 [2] NCCL INFO Channel 00 : 6[43000] -> 5[26000] via P2P/IPC comm 0x2b3e48000ab0 nRanks 96 e08r2n13:23994:25164 [2] NCCL INFO Connected all rings comm 0x2b5d8c000ab0 nRanks 96 busId 43000 e08r2n09:27005:27965 [2] NCCL INFO Channel 01 : 6[43000] -> 5[26000] via P2P/IPC comm 0x2b3e48000ab0 nRanks 96 e08r2n16:13445:14603 [2] NCCL INFO Connected all rings comm 0x2b67e4000ab0 nRanks 96 busId 43000 e08r3n01:6278:7261 [2] NCCL INFO Connected all rings comm 0x2b101c000ab0 nRanks 96 busId 43000 e08r2n17:21283:22448 [2] NCCL INFO Connected all rings comm 0x2b9724000ab0 nRanks 96 busId 43000 e08r2n15:22024:23016 [2] NCCL INFO Connected all rings comm 0x2b123c000ab0 nRanks 96 busId 43000 e08r2n13:23994:25164 [2] NCCL INFO Channel 00 : 22[43000] -> 21[26000] via P2P/IPC comm 0x2b5d8c000ab0 nRanks 96 e08r2n14:18195:19161 [2] NCCL INFO Connected all rings comm 0x2b74c4000ab0 nRanks 96 busId 43000 e08r2n19:9033:10155 [2] NCCL INFO Connected all rings comm 0x2b03ac000ab0 nRanks 96 busId 43000 e08r2n13:23994:25164 [2] NCCL INFO Channel 01 : 22[43000] -> 21[26000] via P2P/IPC comm 0x2b5d8c000ab0 nRanks 96 e08r2n18:754:1880 [2] NCCL INFO Connected all rings comm 0x2b2a28000ab0 nRanks 96 busId 43000 e08r3n00:14535:15492 [2] NCCL INFO Connected all rings comm 0x2baf68000ab0 nRanks 96 busId 43000 e08r2n16:13445:14603 [2] NCCL INFO Channel 00 : 34[43000] -> 33[26000] via P2P/IPC comm 0x2b67e4000ab0 nRanks 96 e08r3n01:6278:7261 [2] NCCL INFO Channel 00 : 54[43000] -> 53[26000] via P2P/IPC comm 0x2b101c000ab0 nRanks 96 e08r3n02:30404:31213 [2] NCCL INFO Connected all rings comm 0x2b67ac000ab0 nRanks 96 busId 43000 e08r2n17:21283:22448 [2] NCCL INFO Channel 00 : 38[43000] -> 37[26000] via P2P/IPC comm 0x2b9724000ab0 nRanks 96 e08r2n16:13445:14603 [2] NCCL INFO Channel 01 : 34[43000] -> 33[26000] via P2P/IPC comm 0x2b67e4000ab0 nRanks 96 e08r2n15:22024:23016 [2] NCCL INFO Channel 00 : 30[43000] -> 29[26000] via P2P/IPC comm 0x2b123c000ab0 nRanks 96 e08r2n19:9033:10155 [2] NCCL INFO Channel 00 : 46[43000] -> 45[26000] via P2P/IPC comm 0x2b03ac000ab0 nRanks 96 e08r3n01:6278:7261 [2] NCCL INFO Channel 01 : 54[43000] -> 53[26000] via P2P/IPC comm 0x2b101c000ab0 nRanks 96 e08r2n17:21283:22448 [2] NCCL INFO Channel 01 : 38[43000] -> 37[26000] via P2P/IPC comm 0x2b9724000ab0 nRanks 96 e08r2n14:18195:19161 [2] NCCL INFO Channel 00 : 26[43000] -> 25[26000] via P2P/IPC comm 0x2b74c4000ab0 nRanks 96 e08r2n15:22024:23016 [2] NCCL INFO Channel 01 : 30[43000] -> 29[26000] via P2P/IPC comm 0x2b123c000ab0 nRanks 96 e08r3n00:14535:15492 [2] NCCL INFO Channel 00 : 50[43000] -> 49[26000] via P2P/IPC comm 0x2baf68000ab0 nRanks 96 e08r2n18:754:1880 [2] NCCL INFO Channel 00 : 42[43000] -> 41[26000] via P2P/IPC comm 0x2b2a28000ab0 nRanks 96 e08r2n14:18195:19161 [2] NCCL INFO Channel 01 : 26[43000] -> 25[26000] via P2P/IPC comm 0x2b74c4000ab0 nRanks 96 e08r3n02:30404:31213 [2] NCCL INFO Channel 00 : 58[43000] -> 57[26000] via P2P/IPC comm 0x2b67ac000ab0 nRanks 96 e08r2n19:9033:10155 [2] NCCL INFO Channel 01 : 46[43000] -> 45[26000] via P2P/IPC comm 0x2b03ac000ab0 nRanks 96 e08r2n18:754:1880 [2] NCCL INFO Channel 01 : 42[43000] -> 41[26000] via P2P/IPC comm 0x2b2a28000ab0 nRanks 96 e08r3n00:14535:15492 [2] NCCL INFO Channel 01 : 50[43000] -> 49[26000] via P2P/IPC comm 0x2baf68000ab0 nRanks 96 e08r3n02:30404:31213 [2] NCCL INFO Channel 01 : 58[43000] -> 57[26000] via P2P/IPC comm 0x2b67ac000ab0 nRanks 96 e08r3n03:22739:23827 [3] NCCL INFO Connected all rings comm 0x2b0524000ab0 nRanks 96 busId 63000 e08r3n03:22739:23827 [3] NCCL INFO Channel 00 : 63[63000] -> 62[43000] via P2P/IPC comm 0x2b0524000ab0 nRanks 96 e08r3n03:22739:23827 [3] NCCL INFO Channel 01 : 63[63000] -> 62[43000] via P2P/IPC comm 0x2b0524000ab0 nRanks 96 e08r3n08:13438:14591 [3] NCCL INFO Connected all rings comm 0x2b2614000ab0 nRanks 96 busId 63000 e08r3n08:13438:14591 [3] NCCL INFO Channel 00 : 83[63000] -> 82[43000] via P2P/IPC comm 0x2b2614000ab0 nRanks 96 e08r3n08:13438:14591 [3] NCCL INFO Channel 01 : 83[63000] -> 82[43000] via P2P/IPC comm 0x2b2614000ab0 nRanks 96 e08r3n05:24735:25797 [3] NCCL INFO Connected all rings comm 0x2ac218000ab0 nRanks 96 busId 63000 e08r3n05:24735:25797 [3] NCCL INFO Channel 00 : 71[63000] -> 70[43000] via P2P/IPC comm 0x2ac218000ab0 nRanks 96 e08r3n07:4893:5961 [3] NCCL INFO Connected all rings comm 0x2ba69c000ab0 nRanks 96 busId 63000 e08r3n07:4893:5961 [3] NCCL INFO Channel 00 : 79[63000] -> 78[43000] via P2P/IPC comm 0x2ba69c000ab0 nRanks 96 e08r2n08:5142:6491 [3] NCCL INFO Connected all rings comm 0x2ad4a8000ab0 nRanks 96 busId 63000 e08r2n08:5142:6491 [3] NCCL INFO Channel 00 : 3[63000] -> 2[43000] via P2P/IPC comm 0x2ad4a8000ab0 nRanks 96 e08r3n05:24735:25797 [3] NCCL INFO Channel 01 : 71[63000] -> 70[43000] via P2P/IPC comm 0x2ac218000ab0 nRanks 96 e08r3n11:29649:30749 [3] NCCL INFO Connected all rings comm 0x2ba6ec000ab0 nRanks 96 busId 63000 e08r3n07:4893:5961 [3] NCCL INFO Channel 01 : 79[63000] -> 78[43000] via P2P/IPC comm 0x2ba69c000ab0 nRanks 96 e08r2n08:5142:6491 [3] NCCL INFO Channel 01 : 3[63000] -> 2[43000] via P2P/IPC comm 0x2ad4a8000ab0 nRanks 96 e08r3n11:29649:30749 [3] NCCL INFO Channel 00 : 95[63000] -> 94[43000] via P2P/IPC comm 0x2ba6ec000ab0 nRanks 96 e08r3n04:16940:17743 [3] NCCL INFO Connected all rings comm 0x2b1e28000ab0 nRanks 96 busId 63000 e08r3n04:16940:17743 [3] NCCL INFO Channel 00 : 67[63000] -> 66[43000] via P2P/IPC comm 0x2b1e28000ab0 nRanks 96 e08r3n09:8679:9728 [3] NCCL INFO Connected all rings comm 0x2b0c4c000ab0 nRanks 96 busId 63000 e08r3n09:8679:9728 [3] NCCL INFO Channel 00 : 87[63000] -> 86[43000] via P2P/IPC comm 0x2b0c4c000ab0 nRanks 96 e08r3n11:29649:30749 [3] NCCL INFO Channel 01 : 95[63000] -> 94[43000] via P2P/IPC comm 0x2ba6ec000ab0 nRanks 96 e08r3n04:16940:17743 [3] NCCL INFO Channel 01 : 67[63000] -> 66[43000] via P2P/IPC comm 0x2b1e28000ab0 nRanks 96 e08r3n09:8679:9728 [3] NCCL INFO Channel 01 : 87[63000] -> 86[43000] via P2P/IPC comm 0x2b0c4c000ab0 nRanks 96 e08r3n03:22739:23827 [3] NCCL INFO Connected all trees comm 0x2b0524000ab0 nRanks 96 busId 63000 e08r3n03:22739:23827 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n03:22739:23827 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n12:8675:9665 [3] NCCL INFO Connected all rings comm 0x2b2e18000ab0 nRanks 96 busId 63000 e08r2n12:8675:9665 [3] NCCL INFO Channel 00 : 19[63000] -> 18[43000] via P2P/IPC comm 0x2b2e18000ab0 nRanks 96 e08r2n10:876:1918 [3] NCCL INFO Connected all rings comm 0x2b2d0c000ab0 nRanks 96 busId 63000 e08r3n06:22285:23335 [3] NCCL INFO Connected all rings comm 0x2b91b4000ab0 nRanks 96 busId 63000 e08r2n10:876:1918 [3] NCCL INFO Channel 00 : 11[63000] -> 10[43000] via P2P/IPC comm 0x2b2d0c000ab0 nRanks 96 e08r3n06:22285:23335 [3] NCCL INFO Channel 00 : 75[63000] -> 74[43000] via P2P/IPC comm 0x2b91b4000ab0 nRanks 96 e08r2n12:8675:9665 [3] NCCL INFO Channel 01 : 19[63000] -> 18[43000] via P2P/IPC comm 0x2b2e18000ab0 nRanks 96 e08r3n08:13438:14591 [3] NCCL INFO Connected all trees comm 0x2b2614000ab0 nRanks 96 busId 63000 e08r3n04:16936:17745 [0] NCCL INFO Connected all rings comm 0x2b3574000ab0 nRanks 96 busId 4000 e08r3n08:13438:14591 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n08:13438:14591 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n10:876:1918 [3] NCCL INFO Channel 01 : 11[63000] -> 10[43000] via P2P/IPC comm 0x2b2d0c000ab0 nRanks 96 e08r3n05:24735:25797 [3] NCCL INFO Connected all trees comm 0x2ac218000ab0 nRanks 96 busId 63000 e08r3n10:18788:19808 [3] NCCL INFO Connected all rings comm 0x2ad848000ab0 nRanks 96 busId 63000 e08r3n06:22285:23335 [3] NCCL INFO Channel 01 : 75[63000] -> 74[43000] via P2P/IPC comm 0x2b91b4000ab0 nRanks 96 e08r3n10:18788:19808 [3] NCCL INFO Channel 00 : 91[63000] -> 90[43000] via P2P/IPC comm 0x2ad848000ab0 nRanks 96 e08r3n05:24735:25797 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n05:24735:25797 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n08:5136:6335 [0] NCCL INFO Connected all rings comm 0x2b2e44000ab0 nRanks 96 busId 4000 e08r3n07:4893:5961 [3] NCCL INFO Connected all trees comm 0x2ba69c000ab0 nRanks 96 busId 63000 e08r3n08:13434:14586 [0] NCCL INFO Connected all rings comm 0x2abcf4000ab0 nRanks 96 busId 4000 e08r3n07:4893:5961 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22281:23330 [0] NCCL INFO Connected all rings comm 0x2af9e0000ab0 nRanks 96 busId 4000 e08r3n07:4893:5961 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n08:5141:6541 [2] NCCL INFO Connected all trees comm 0x2b5bd8000ab0 nRanks 96 busId 43000 e08r3n11:29649:30749 [3] NCCL INFO Connected all trees comm 0x2ba6ec000ab0 nRanks 96 busId 63000 e08r3n10:18788:19808 [3] NCCL INFO Channel 01 : 91[63000] -> 90[43000] via P2P/IPC comm 0x2ad848000ab0 nRanks 96 e08r2n08:5141:6541 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5141:6541 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27006:27966 [3] NCCL INFO Connected all rings comm 0x2b56e4000ab0 nRanks 96 busId 63000 e08r3n11:29649:30749 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n11:29649:30749 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n08:5142:6491 [3] NCCL INFO Connected all trees comm 0x2ad4a8000ab0 nRanks 96 busId 63000 e08r2n09:27006:27966 [3] NCCL INFO Channel 00 : 7[63000] -> 6[43000] via P2P/IPC comm 0x2b56e4000ab0 nRanks 96 e08r2n08:5142:6491 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5142:6491 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8675:9723 [0] NCCL INFO Connected all rings comm 0x2b416c000ab0 nRanks 96 busId 4000 e08r3n11:29648:30753 [2] NCCL INFO Connected all trees comm 0x2b8da8000ab0 nRanks 96 busId 43000 e08r3n05:24731:25791 [0] NCCL INFO Connected all rings comm 0x2b85d4000ab0 nRanks 96 busId 4000 e08r3n11:29648:30753 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n11:29648:30753 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8679:9728 [3] NCCL INFO Connected all trees comm 0x2b0c4c000ab0 nRanks 96 busId 63000 e08r2n09:27006:27966 [3] NCCL INFO Channel 01 : 7[63000] -> 6[43000] via P2P/IPC comm 0x2b56e4000ab0 nRanks 96 e08r3n09:8679:9728 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5734:6772 [3] NCCL INFO Connected all rings comm 0x2b4144000ab0 nRanks 96 busId 63000 e08r2n16:13446:14609 [3] NCCL INFO Connected all rings comm 0x2abfb8000ab0 nRanks 96 busId 63000 e08r3n09:8679:9728 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5734:6772 [3] NCCL INFO Channel 00 : 15[63000] -> 14[43000] via P2P/IPC comm 0x2b4144000ab0 nRanks 96 e08r2n16:13446:14609 [3] NCCL INFO Channel 00 : 35[63000] -> 34[43000] via P2P/IPC comm 0x2abfb8000ab0 nRanks 96 e08r3n04:16940:17743 [3] NCCL INFO Connected all trees comm 0x2b1e28000ab0 nRanks 96 busId 63000 e08r3n04:16940:17743 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n04:16940:17743 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n16:13446:14609 [3] NCCL INFO Channel 01 : 35[63000] -> 34[43000] via P2P/IPC comm 0x2abfb8000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Connected all rings comm 0x2aed78000ab0 nRanks 96 busId 4000 e08r2n14:18196:19160 [3] NCCL INFO Connected all rings comm 0x2ab5e8000ab0 nRanks 96 busId 63000 e08r2n14:18196:19160 [3] NCCL INFO Channel 00 : 27[63000] -> 26[43000] via P2P/IPC comm 0x2ab5e8000ab0 nRanks 96 e08r2n11:5734:6772 [3] NCCL INFO Channel 01 : 15[63000] -> 14[43000] via P2P/IPC comm 0x2b4144000ab0 nRanks 96 e08r2n19:9034:10156 [3] NCCL INFO Connected all rings comm 0x2b6940000ab0 nRanks 96 busId 63000 e08r2n12:8675:9665 [3] NCCL INFO Connected all trees comm 0x2b2e18000ab0 nRanks 96 busId 63000 e08r2n19:9034:10156 [3] NCCL INFO Channel 00 : 47[63000] -> 46[43000] via P2P/IPC comm 0x2b6940000ab0 nRanks 96 e08r3n00:14536:15487 [3] NCCL INFO Connected all rings comm 0x2b7774000ab0 nRanks 96 busId 63000 e08r3n00:14536:15487 [3] NCCL INFO Channel 00 : 51[63000] -> 50[43000] via P2P/IPC comm 0x2b7774000ab0 nRanks 96 e08r2n12:8675:9665 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n12:8675:9665 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5730:6763 [0] NCCL INFO Connected all rings comm 0x2b7a5c000ab0 nRanks 96 busId 4000 e08r3n11:29645:30741 [0] NCCL INFO Connected all rings comm 0x2ac238000ab0 nRanks 96 busId 4000 e08r2n14:18196:19160 [3] NCCL INFO Channel 01 : 27[63000] -> 26[43000] via P2P/IPC comm 0x2ab5e8000ab0 nRanks 96 e08r2n10:876:1918 [3] NCCL INFO Connected all trees comm 0x2b2d0c000ab0 nRanks 96 busId 63000 e08r2n09:27002:27953 [0] NCCL INFO Connected all rings comm 0x2b0d1c000ab0 nRanks 96 busId 4000 e08r2n10:876:1918 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n10:876:1918 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23995:25163 [3] NCCL INFO Connected all rings comm 0x2b4b08000ab0 nRanks 96 busId 63000 e08r3n06:22285:23335 [3] NCCL INFO Connected all trees comm 0x2b91b4000ab0 nRanks 96 busId 63000 e08r2n13:23995:25163 [3] NCCL INFO Channel 00 : 23[63000] -> 22[43000] via P2P/IPC comm 0x2b4b08000ab0 nRanks 96 e08r3n06:22285:23335 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22285:23335 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n19:9034:10156 [3] NCCL INFO Channel 01 : 47[63000] -> 46[43000] via P2P/IPC comm 0x2b6940000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Connected all rings comm 0x2b6040000ab0 nRanks 96 busId 4000 e08r2n17:21284:22443 [3] NCCL INFO Connected all rings comm 0x2ba520000ab0 nRanks 96 busId 63000 e08r3n01:6279:7255 [3] NCCL INFO Connected all rings comm 0x2aea58000ab0 nRanks 96 busId 63000 e08r2n17:21284:22443 [3] NCCL INFO Channel 00 : 39[63000] -> 38[43000] via P2P/IPC comm 0x2ba520000ab0 nRanks 96 e08r3n01:6279:7255 [3] NCCL INFO Channel 00 : 55[63000] -> 54[43000] via P2P/IPC comm 0x2aea58000ab0 nRanks 96 e08r3n00:14536:15487 [3] NCCL INFO Channel 01 : 51[63000] -> 50[43000] via P2P/IPC comm 0x2b7774000ab0 nRanks 96 e08r2n13:23995:25163 [3] NCCL INFO Channel 01 : 23[63000] -> 22[43000] via P2P/IPC comm 0x2b4b08000ab0 nRanks 96 e08r2n15:22025:23017 [3] NCCL INFO Connected all rings comm 0x2b3208000ab0 nRanks 96 busId 63000 e08r2n15:22025:23017 [3] NCCL INFO Channel 00 : 31[63000] -> 30[43000] via P2P/IPC comm 0x2b3208000ab0 nRanks 96 e08r2n17:21284:22443 [3] NCCL INFO Channel 01 : 39[63000] -> 38[43000] via P2P/IPC comm 0x2ba520000ab0 nRanks 96 e08r3n01:6279:7255 [3] NCCL INFO Channel 01 : 55[63000] -> 54[43000] via P2P/IPC comm 0x2aea58000ab0 nRanks 96 e08r3n10:18788:19808 [3] NCCL INFO Connected all trees comm 0x2ad848000ab0 nRanks 96 busId 63000 e08r3n02:30405:31208 [3] NCCL INFO Connected all rings comm 0x2b6924000ab0 nRanks 96 busId 63000 e08r3n10:18788:19808 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n02:30405:31208 [3] NCCL INFO Channel 00 : 59[63000] -> 58[43000] via P2P/IPC comm 0x2b6924000ab0 nRanks 96 e08r2n15:22025:23017 [3] NCCL INFO Channel 01 : 31[63000] -> 30[43000] via P2P/IPC comm 0x2b3208000ab0 nRanks 96 e08r3n10:18788:19808 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n12:8671:9661 [0] NCCL INFO Connected all rings comm 0x2b66f4000ab0 nRanks 96 busId 4000 e08r2n18:755:1882 [3] NCCL INFO Connected all rings comm 0x2b7fac000ab0 nRanks 96 busId 63000 e08r2n18:755:1882 [3] NCCL INFO Channel 00 : 43[63000] -> 42[43000] via P2P/IPC comm 0x2b7fac000ab0 nRanks 96 e08r3n02:30405:31208 [3] NCCL INFO Channel 01 : 59[63000] -> 58[43000] via P2P/IPC comm 0x2b6924000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Connected all rings comm 0x2b5d18000ab0 nRanks 96 busId 4000 e08r2n18:755:1882 [3] NCCL INFO Channel 01 : 43[63000] -> 42[43000] via P2P/IPC comm 0x2b7fac000ab0 nRanks 96 e08r2n16:13446:14609 [3] NCCL INFO Connected all trees comm 0x2abfb8000ab0 nRanks 96 busId 63000 e08r2n16:13446:14609 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n16:13446:14609 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27006:27966 [3] NCCL INFO Connected all trees comm 0x2b56e4000ab0 nRanks 96 busId 63000 e08r3n10:18784:19834 [0] NCCL INFO Connected all rings comm 0x2af008000ab0 nRanks 96 busId 4000 e08r2n17:21280:22441 [0] NCCL INFO Connected all rings comm 0x2aff88000ab0 nRanks 96 busId 4000 e08r2n09:27006:27966 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n09:27006:27966 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5734:6772 [3] NCCL INFO Connected all trees comm 0x2b4144000ab0 nRanks 96 busId 63000 e08r2n16:13442:14572 [0] NCCL INFO Connected all rings comm 0x2b4aa4000ab0 nRanks 96 busId 4000 e08r2n11:5734:6772 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5734:6772 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23991:25150 [0] NCCL INFO Connected all rings comm 0x2b5014000ab0 nRanks 96 busId 4000 e08r3n02:30401:31205 [0] NCCL INFO Connected all rings comm 0x2bab5c000ab0 nRanks 96 busId 4000 e08r2n14:18192:19156 [0] NCCL INFO Connected all rings comm 0x2b88b4000ab0 nRanks 96 busId 4000 e08r3n00:14532:15473 [0] NCCL INFO Connected all rings comm 0x2abe48000ab0 nRanks 96 busId 4000 e08r2n14:18196:19160 [3] NCCL INFO Connected all trees comm 0x2ab5e8000ab0 nRanks 96 busId 63000 e08r2n14:18196:19160 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n14:18196:19160 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n19:9034:10156 [3] NCCL INFO Connected all trees comm 0x2b6940000ab0 nRanks 96 busId 63000 e08r3n00:14536:15487 [3] NCCL INFO Connected all trees comm 0x2b7774000ab0 nRanks 96 busId 63000 e08r2n19:9034:10156 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n19:9034:10156 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14536:15487 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n00:14536:15487 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23995:25163 [3] NCCL INFO Connected all trees comm 0x2b4b08000ab0 nRanks 96 busId 63000 e08r2n13:23995:25163 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n13:23995:25163 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21284:22443 [3] NCCL INFO Connected all trees comm 0x2ba520000ab0 nRanks 96 busId 63000 e08r3n03:22735:23820 [0] NCCL INFO Connected all rings comm 0x2b4504000ab0 nRanks 96 busId 4000 e08r2n17:21284:22443 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n17:21284:22443 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n01:6275:7256 [0] NCCL INFO Connected all rings comm 0x2b8738000ab0 nRanks 96 busId 4000 e08r2n18:751:1877 [0] NCCL INFO Connected all rings comm 0x2b8134000ab0 nRanks 96 busId 4000 e08r3n01:6279:7255 [3] NCCL INFO Connected all trees comm 0x2aea58000ab0 nRanks 96 busId 63000 e08r3n01:6279:7255 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n01:6279:7255 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n19:9030:10143 [0] NCCL INFO Connected all rings comm 0x2ab408000ab0 nRanks 96 busId 4000 e08r2n15:22025:23017 [3] NCCL INFO Connected all trees comm 0x2b3208000ab0 nRanks 96 busId 63000 e08r2n15:22025:23017 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n15:22025:23017 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30405:31208 [3] NCCL INFO Connected all trees comm 0x2b6924000ab0 nRanks 96 busId 63000 e08r3n02:30405:31208 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n02:30405:31208 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n18:755:1882 [3] NCCL INFO Connected all trees comm 0x2b7fac000ab0 nRanks 96 busId 63000 e08r2n18:755:1882 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n18:755:1882 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n04:16936:17745 [0] NCCL INFO Channel 01/0 : 64[4000] -> 68[4000] [send] via NET/IB/0 comm 0x2b3574000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Channel 01/0 : 69[26000] -> 72[4000] [receive] via NET/IB/0 comm 0x2af9e0000ab0 nRanks 96 e08r3n08:13434:14586 [0] NCCL INFO Channel 01/0 : 80[4000] -> 84[4000] [send] via NET/IB/0 comm 0x2abcf4000ab0 nRanks 96 e08r2n08:5136:6335 [0] NCCL INFO Channel 01/0 : 0[4000] -> 4[4000] [send] via NET/IB/0 comm 0x2b2e44000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO Channel 01/0 : 64[4000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b85d4000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Channel 00/0 : 72[4000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aed78000ab0 nRanks 96 e08r3n09:8675:9723 [0] NCCL INFO Channel 01/0 : 80[4000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b416c000ab0 nRanks 96 e08r2n11:5730:6763 [0] NCCL INFO Channel 00/0 : 8[4000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7a5c000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Channel 01/0 : 5[26000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b6040000ab0 nRanks 96 e08r2n09:27002:27953 [0] NCCL INFO Channel 01/0 : 0[4000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0d1c000ab0 nRanks 96 e08r3n11:29645:30741 [0] NCCL INFO Channel 00/0 : 88[4000] -> 92[4000] [receive] via NET/IB/0 comm 0x2ac238000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 01/0 : 16[4000] -> 20[4000] [send] via NET/IB/0 comm 0x2b66f4000ab0 nRanks 96 e08r2n16:13442:14572 [0] NCCL INFO Channel 01/0 : 32[4000] -> 36[4000] [send] via NET/IB/0 comm 0x2b4aa4000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 00/0 : 24[4000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5d18000ab0 nRanks 96 e08r2n14:18192:19156 [0] NCCL INFO Channel 01/0 : 21[26000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b88b4000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Channel 01/0 : 32[4000] -> 36[4000] [receive] via NET/IB/0 comm 0x2aff88000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 01/0 : 85[26000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af008000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Channel 01/0 : 48[4000] -> 52[4000] [send] via NET/IB/0 comm 0x2abe48000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 01/0 : 16[4000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b5014000ab0 nRanks 96 e08r3n02:30401:31205 [0] NCCL INFO Channel 01/0 : 53[26000] -> 56[4000] [receive] via NET/IB/0 comm 0x2bab5c000ab0 nRanks 96 e08r2n18:751:1877 [0] NCCL INFO Channel 01/0 : 37[26000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8134000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 01/0 : 48[4000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b8738000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Channel 00/0 : 40[4000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab408000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 00/0 : 56[4000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4504000ab0 nRanks 96 e08r3n05:24733:25802 [1] NCCL INFO Channel 01/0 : 72[4000] -> 69[26000] [receive] via NET/IB/0 comm 0x2ab9d4000ab0 nRanks 96 e08r3n04:16936:17745 [0] NCCL INFO Channel 00/0 : 64[4000] -> 80[4000] [send] via NET/IB/0 comm 0x2b3574000ab0 nRanks 96 e08r3n08:13434:14586 [0] NCCL INFO Channel 00/0 : 80[4000] -> 88[4000] [send] via NET/IB/0 comm 0x2abcf4000ab0 nRanks 96 e08r2n08:5136:6335 [0] NCCL INFO Channel 00/0 : 64[4000] -> 0[4000] [receive] via NET/IB/0 comm 0x2b2e44000ab0 nRanks 96 e08r2n09:27004:27956 [1] NCCL INFO Channel 01/0 : 8[4000] -> 5[26000] [receive] via NET/IB/0 comm 0x2af6e0000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO Channel 00/0 : 68[4000] -> 73[26000] [send] via NET/IB/0 comm 0x2b85d4000ab0 nRanks 96 e08r2n09:27002:27953 [0] NCCL INFO Channel 00/0 : 4[4000] -> 9[26000] [send] via NET/IB/0 comm 0x2b0d1c000ab0 nRanks 96 e08r2n13:23993:25161 [1] NCCL INFO Channel 01/0 : 24[4000] -> 21[26000] [receive] via NET/IB/0 comm 0x2b4058000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 00/0 : 16[4000] -> 24[4000] [send] via NET/IB/0 comm 0x2b66f4000ab0 nRanks 96 e08r2n16:13442:14572 [0] NCCL INFO Channel 00/0 : 32[4000] -> 48[4000] [send] via NET/IB/0 comm 0x2b4aa4000ab0 nRanks 96 e08r3n09:8675:9723 [0] NCCL INFO Channel 00/0 : 84[4000] -> 89[26000] [send] via NET/IB/0 comm 0x2b416c000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Channel 00/0 : 72[4000] -> 76[4000] [send] via NET/IB/0 comm 0x2af9e0000ab0 nRanks 96 e08r3n09:8677:9721 [1] NCCL INFO Channel 01/0 : 88[4000] -> 85[26000] [receive] via NET/IB/0 comm 0x2b4344000ab0 nRanks 96 e08r3n01:6277:7260 [1] NCCL INFO Channel 01/0 : 56[4000] -> 53[26000] [receive] via NET/IB/0 comm 0x2ba34c000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Channel 00/0 : 48[4000] -> 56[4000] [send] via NET/IB/0 comm 0x2abe48000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Channel 00/0 : 8[4000] -> 12[4000] [send] via NET/IB/0 comm 0x2b6040000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 00/0 : 20[4000] -> 25[26000] [send] via NET/IB/0 comm 0x2b5014000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Channel 00/0 : 36[4000] -> 41[26000] [send] via NET/IB/0 comm 0x2aff88000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 00/0 : 88[4000] -> 92[4000] [send] via NET/IB/0 comm 0x2af008000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 00/0 : 52[4000] -> 57[26000] [send] via NET/IB/0 comm 0x2b8738000ab0 nRanks 96 e08r2n17:21282:22447 [1] NCCL INFO Channel 01/0 : 40[4000] -> 37[26000] [receive] via NET/IB/0 comm 0x2abf00000ab0 nRanks 96 e08r3n02:30401:31205 [0] NCCL INFO Channel 00/0 : 56[4000] -> 60[4000] [send] via NET/IB/0 comm 0x2bab5c000ab0 nRanks 96 e08r2n14:18192:19156 [0] NCCL INFO Channel 00/0 : 24[4000] -> 28[4000] [send] via NET/IB/0 comm 0x2b88b4000ab0 nRanks 96 e08r2n18:751:1877 [0] NCCL INFO Channel 00/0 : 40[4000] -> 44[4000] [send] via NET/IB/0 comm 0x2b8134000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO Channel 01/0 : 68[4000] -> 76[4000] [send] via NET/IB/0 comm 0x2b85d4000ab0 nRanks 96 e08r2n09:27002:27953 [0] NCCL INFO Channel 01/0 : 4[4000] -> 12[4000] [send] via NET/IB/0 comm 0x2b0d1c000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Channel 00/0 : 72[4000] -> 81[26000] [send] via NET/IB/0 comm 0x2af9e0000ab0 nRanks 96 e08r3n09:8675:9723 [0] NCCL INFO Channel 01/0 : 77[26000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b416c000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Channel 00/0 : 8[4000] -> 17[26000] [send] via NET/IB/0 comm 0x2b6040000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 01/0 : 13[26000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b5014000ab0 nRanks 96 e08r3n06:22283:23339 [1] NCCL INFO Channel 00/0 : 73[26000] -> 68[4000] [send] via NET/IB/0 comm 0x2b9a88000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Channel 01/0 : 36[4000] -> 44[4000] [send] via NET/IB/0 comm 0x2aff88000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 00/0 : 80[4000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af008000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 01/0 : 45[26000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b8738000ab0 nRanks 96 e08r2n10:874:1920 [1] NCCL INFO Channel 00/0 : 9[26000] -> 4[4000] [send] via NET/IB/0 comm 0x2b1f10000ab0 nRanks 96 e08r3n02:30401:31205 [0] NCCL INFO Channel 00/0 : 48[4000] -> 56[4000] [receive] via NET/IB/0 comm 0x2bab5c000ab0 nRanks 96 e08r3n10:18786:19830 [1] NCCL INFO Channel 00/0 : 89[26000] -> 84[4000] [send] via NET/IB/0 comm 0x2ac35c000ab0 nRanks 96 e08r2n14:18192:19156 [0] NCCL INFO Channel 00/0 : 16[4000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b88b4000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Channel 01/0 : 68[4000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aed78000ab0 nRanks 96 e08r2n14:18194:19155 [1] NCCL INFO Channel 00/0 : 25[26000] -> 20[4000] [send] via NET/IB/0 comm 0x2b43b4000ab0 nRanks 96 e08r2n18:751:1877 [0] NCCL INFO Channel 00/0 : 40[4000] -> 49[26000] [send] via NET/IB/0 comm 0x2b8134000ab0 nRanks 96 e08r3n02:30403:31209 [1] NCCL INFO Channel 00/0 : 57[26000] -> 52[4000] [send] via NET/IB/0 comm 0x2ba198000ab0 nRanks 96 e08r2n18:753:1883 [1] NCCL INFO Channel 00/0 : 41[26000] -> 36[4000] [send] via NET/IB/0 comm 0x2b30f4000ab0 nRanks 96 e08r2n11:5730:6763 [0] NCCL INFO Channel 01/0 : 4[4000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7a5c000ab0 nRanks 96 e08r3n11:29645:30741 [0] NCCL INFO Channel 01/0 : 92[4000] -> 28[4000] [send] via NET/IB/0 comm 0x2ac238000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 01/0 : 44[4000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4504000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 01/0 : 12[4000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5d18000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Channel 01/0 : 36[4000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab408000ab0 nRanks 96 e08r3n07:4891:5944 [1] NCCL INFO Channel 01/0 : 84[4000] -> 77[26000] [receive] via NET/IB/0 comm 0x2b7a94000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Channel 00/0 : 81[26000] -> 72[4000] [receive] via NET/IB/0 comm 0x2af9e0000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Channel 00/0 : 17[26000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b6040000ab0 nRanks 96 e08r2n19:9032:10150 [1] NCCL INFO Channel 01/0 : 52[4000] -> 45[26000] [receive] via NET/IB/0 comm 0x2af5f8000ab0 nRanks 96 e08r2n11:5732:6769 [1] NCCL INFO Channel 01/0 : 20[4000] -> 13[26000] [receive] via NET/IB/0 comm 0x2b11a0000ab0 nRanks 96 e08r3n08:13436:14594 [1] NCCL INFO Channel 00/0 : 81[26000] -> 72[4000] [send] via NET/IB/0 comm 0x2b1954000ab0 nRanks 96 e08r3n08:13434:14586 [0] NCCL INFO Channel 00/0 : 64[4000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abcf4000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Channel 00/0 : 32[4000] -> 48[4000] [receive] via NET/IB/0 comm 0x2abe48000ab0 nRanks 96 e08r3n09:8675:9723 [0] NCCL INFO Channel 01/0 : 84[4000] -> 77[26000] [send] via NET/IB/0 comm 0x2b416c000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO Channel 01/0 : 76[4000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b85d4000ab0 nRanks 96 e08r2n18:751:1877 [0] NCCL INFO Channel 00/0 : 49[26000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8134000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 00/0 : 16[4000] -> 33[26000] [send] via NET/IB/0 comm 0x2b66f4000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 01/0 : 20[4000] -> 13[26000] [send] via NET/IB/0 comm 0x2b5014000ab0 nRanks 96 e08r2n12:8673:9656 [1] NCCL INFO Channel 00/0 : 17[26000] -> 8[4000] [send] via NET/IB/0 comm 0x2b92b8000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Channel 01/0 : 61[26000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aed78000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 01/0 : 52[4000] -> 45[26000] [send] via NET/IB/0 comm 0x2b8738000ab0 nRanks 96 e08r2n09:27002:27953 [0] NCCL INFO Channel 01/0 : 12[4000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0d1c000ab0 nRanks 96 e08r3n02:30401:31205 [0] NCCL INFO Channel 00/0 : 56[4000] -> 48[4000] [send] via NET/IB/0 comm 0x2bab5c000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 00/0 : 88[4000] -> 80[4000] [send] via NET/IB/0 comm 0x2af008000ab0 nRanks 96 e08r3n00:14534:15491 [1] NCCL INFO Channel 00/0 : 49[26000] -> 40[4000] [send] via NET/IB/0 comm 0x2b8bd0000ab0 nRanks 96 e08r2n14:18192:19156 [0] NCCL INFO Channel 00/0 : 24[4000] -> 16[4000] [send] via NET/IB/0 comm 0x2b88b4000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Channel 01/0 : 44[4000] -> 36[4000] [receive] via NET/IB/0 comm 0x2aff88000ab0 nRanks 96 e08r2n11:5730:6763 [0] NCCL INFO Channel 01/0 : 12[4000] -> 28[4000] [send] via NET/IB/0 comm 0x2b7a5c000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Channel 01/0 : 44[4000] -> 60[4000] [send] via NET/IB/0 comm 0x2ab408000ab0 nRanks 96 e08r3n08:13436:14594 [1] NCCL INFO Channel 00 : 81[26000] -> 80[4000] via P2P/IPC comm 0x2b1954000ab0 nRanks 96 e08r3n08:13436:14594 [1] NCCL INFO Channel 01 : 81[26000] -> 80[4000] via P2P/IPC comm 0x2b1954000ab0 nRanks 96 e08r2n12:8673:9656 [1] NCCL INFO Channel 00 : 17[26000] -> 16[4000] via P2P/IPC comm 0x2b92b8000ab0 nRanks 96 e08r2n12:8673:9656 [1] NCCL INFO Channel 01 : 17[26000] -> 16[4000] via P2P/IPC comm 0x2b92b8000ab0 nRanks 96 e08r3n08:13437:14595 [2] NCCL INFO Connected all trees comm 0x2b8f38000ab0 nRanks 96 busId 43000 e08r3n08:13437:14595 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n08:13437:14595 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n12:8674:9663 [2] NCCL INFO Connected all trees comm 0x2b65a0000ab0 nRanks 96 busId 43000 e08r2n12:8674:9663 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n00:14534:15491 [1] NCCL INFO Channel 00 : 49[26000] -> 48[4000] via P2P/IPC comm 0x2b8bd0000ab0 nRanks 96 e08r2n12:8674:9663 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14534:15491 [1] NCCL INFO Channel 01 : 49[26000] -> 48[4000] via P2P/IPC comm 0x2b8bd0000ab0 nRanks 96 e08r3n07:4891:5944 [1] NCCL INFO Channel 00 : 77[26000] -> 76[4000] via P2P/IPC comm 0x2b7a94000ab0 nRanks 96 e08r3n07:4891:5944 [1] NCCL INFO Channel 01 : 77[26000] -> 76[4000] via P2P/IPC comm 0x2b7a94000ab0 nRanks 96 e08r2n11:5732:6769 [1] NCCL INFO Channel 00 : 13[26000] -> 12[4000] via P2P/IPC comm 0x2b11a0000ab0 nRanks 96 e08r2n11:5732:6769 [1] NCCL INFO Channel 01 : 13[26000] -> 12[4000] via P2P/IPC comm 0x2b11a0000ab0 nRanks 96 e08r2n19:9032:10150 [1] NCCL INFO Channel 00 : 45[26000] -> 44[4000] via P2P/IPC comm 0x2af5f8000ab0 nRanks 96 e08r3n07:4892:5963 [2] NCCL INFO Connected all trees comm 0x2b9670000ab0 nRanks 96 busId 43000 e08r3n07:4892:5963 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n07:4892:5963 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n19:9032:10150 [1] NCCL INFO Channel 01 : 45[26000] -> 44[4000] via P2P/IPC comm 0x2af5f8000ab0 nRanks 96 e08r3n00:14535:15492 [2] NCCL INFO Connected all trees comm 0x2baf68000ab0 nRanks 96 busId 43000 e08r3n00:14535:15492 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n00:14535:15492 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5733:6773 [2] NCCL INFO Connected all trees comm 0x2ae6f0000ab0 nRanks 96 busId 43000 e08r2n11:5733:6773 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5733:6773 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n19:9033:10155 [2] NCCL INFO Connected all trees comm 0x2b03ac000ab0 nRanks 96 busId 43000 e08r2n19:9033:10155 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n19:9033:10155 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8675:9723 [0] NCCL INFO Channel 00/0 : 89[26000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b416c000ab0 nRanks 96 e08r3n04:16936:17745 [0] NCCL INFO Channel 00/0 : 64[4000] -> 0[4000] [send] via NET/IB/0 comm 0x2b3574000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 00/0 : 33[26000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b66f4000ab0 nRanks 96 e08r2n16:13442:14572 [0] NCCL INFO Channel 00/0 : 32[4000] -> 65[26000] [send] via NET/IB/0 comm 0x2b4aa4000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 00/0 : 25[26000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b5014000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 00/0 : 57[26000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b8738000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Channel 00/0 : 76[4000] -> 72[4000] [receive] via NET/IB/0 comm 0x2af9e0000ab0 nRanks 96 e08r3n08:13434:14586 [0] NCCL INFO Channel 00/0 : 80[4000] -> 64[4000] [send] via NET/IB/0 comm 0x2abcf4000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Channel 00/0 : 48[4000] -> 32[4000] [send] via NET/IB/0 comm 0x2abe48000ab0 nRanks 96 e08r3n03:22737:23845 [1] NCCL INFO Channel 01/0 : 76[4000] -> 61[26000] [receive] via NET/IB/0 comm 0x2ac6a0000ab0 nRanks 96 e08r2n16:13444:14576 [1] NCCL INFO Channel 00/0 : 33[26000] -> 16[4000] [send] via NET/IB/0 comm 0x2b0180000ab0 nRanks 96 e08r2n10:872:1911 [0] NCCL INFO Channel 00/0 : 12[4000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b6040000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Channel 01/0 : 76[4000] -> 61[26000] [send] via NET/IB/0 comm 0x2aed78000ab0 nRanks 96 e08r2n11:5730:6763 [0] NCCL INFO Channel 01/0 : 28[4000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7a5c000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Channel 01/0 : 60[4000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab408000ab0 nRanks 96 e08r2n18:751:1877 [0] NCCL INFO Channel 00/0 : 44[4000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8134000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 01/0 : 92[4000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5d18000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 01/0 : 29[26000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4504000ab0 nRanks 96 e08r3n10:18786:19830 [1] NCCL INFO Channel 00 : 89[26000] -> 88[4000] via P2P/IPC comm 0x2ac35c000ab0 nRanks 96 e08r3n10:18786:19830 [1] NCCL INFO Channel 01 : 89[26000] -> 88[4000] via P2P/IPC comm 0x2ac35c000ab0 nRanks 96 e08r2n16:13444:14576 [1] NCCL INFO Channel 00 : 33[26000] -> 32[4000] via P2P/IPC comm 0x2b0180000ab0 nRanks 96 e08r2n14:18194:19155 [1] NCCL INFO Channel 00 : 25[26000] -> 24[4000] via P2P/IPC comm 0x2b43b4000ab0 nRanks 96 e08r2n16:13444:14576 [1] NCCL INFO Channel 01 : 33[26000] -> 32[4000] via P2P/IPC comm 0x2b0180000ab0 nRanks 96 e08r2n14:18194:19155 [1] NCCL INFO Channel 01 : 25[26000] -> 24[4000] via P2P/IPC comm 0x2b43b4000ab0 nRanks 96 e08r3n10:18787:19820 [2] NCCL INFO Connected all trees comm 0x2ae6c4000ab0 nRanks 96 busId 43000 e08r3n10:18787:19820 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n10:18787:19820 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30403:31209 [1] NCCL INFO Channel 00 : 57[26000] -> 56[4000] via P2P/IPC comm 0x2ba198000ab0 nRanks 96 e08r3n02:30403:31209 [1] NCCL INFO Channel 01 : 57[26000] -> 56[4000] via P2P/IPC comm 0x2ba198000ab0 nRanks 96 e08r2n16:13445:14603 [2] NCCL INFO Connected all trees comm 0x2b67e4000ab0 nRanks 96 busId 43000 e08r2n16:13445:14603 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n14:18195:19161 [2] NCCL INFO Connected all trees comm 0x2b74c4000ab0 nRanks 96 busId 43000 e08r2n16:13445:14603 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n14:18195:19161 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n14:18195:19161 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30404:31213 [2] NCCL INFO Connected all trees comm 0x2b67ac000ab0 nRanks 96 busId 43000 e08r3n02:30404:31213 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n02:30404:31213 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n03:22737:23845 [1] NCCL INFO Channel 00 : 61[26000] -> 60[4000] via P2P/IPC comm 0x2ac6a0000ab0 nRanks 96 e08r3n03:22737:23845 [1] NCCL INFO Channel 01 : 61[26000] -> 60[4000] via P2P/IPC comm 0x2ac6a0000ab0 nRanks 96 e08r3n03:22738:23847 [2] NCCL INFO Connected all trees comm 0x2af43c000ab0 nRanks 96 busId 43000 e08r3n03:22738:23847 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n03:22738:23847 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n04:16936:17745 [0] NCCL INFO Channel 00/0 : 0[4000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b3574000ab0 nRanks 96 e08r2n16:13442:14572 [0] NCCL INFO Channel 00/0 : 65[26000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4aa4000ab0 nRanks 96 e08r3n04:16938:17748 [1] NCCL INFO Channel 00/0 : 65[26000] -> 32[4000] [send] via NET/IB/0 comm 0x2b0b78000ab0 nRanks 96 e08r3n09:8675:9723 [0] NCCL INFO Channel 01/0 : 84[4000] -> 80[4000] [send] via NET/IB/0 comm 0x2b416c000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Channel 01/0 : 76[4000] -> 68[4000] [send] via NET/IB/0 comm 0x2aed78000ab0 nRanks 96 e08r2n08:5136:6335 [0] NCCL INFO Channel 00/0 : 0[4000] -> 64[4000] [send] via NET/IB/0 comm 0x2b2e44000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Channel 01/0 : 20[4000] -> 16[4000] [send] via NET/IB/0 comm 0x2b5014000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 00/0 : 24[4000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b66f4000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Channel 01/0 : 52[4000] -> 48[4000] [send] via NET/IB/0 comm 0x2b8738000ab0 nRanks 96 e08r3n11:29645:30741 [0] NCCL INFO Channel 01/0 : 28[4000] -> 92[4000] [receive] via NET/IB/0 comm 0x2ac238000ab0 nRanks 96 e08r2n15:22023:23011 [1] NCCL INFO Channel 01/0 : 60[4000] -> 29[26000] [receive] via NET/IB/0 comm 0x2ad4b8000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 01/0 : 28[4000] -> 92[4000] [send] via NET/IB/0 comm 0x2b5d18000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 01/0 : 60[4000] -> 29[26000] [send] via NET/IB/0 comm 0x2b4504000ab0 nRanks 96 e08r3n04:16938:17748 [1] NCCL INFO Channel 00 : 65[26000] -> 64[4000] via P2P/IPC comm 0x2b0b78000ab0 nRanks 96 e08r3n04:16938:17748 [1] NCCL INFO Channel 01 : 65[26000] -> 64[4000] via P2P/IPC comm 0x2b0b78000ab0 nRanks 96 e08r3n04:16939:17749 [2] NCCL INFO Connected all trees comm 0x2b4eb4000ab0 nRanks 96 busId 43000 e08r3n04:16939:17749 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n04:16939:17749 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n15:22023:23011 [1] NCCL INFO Channel 00 : 29[26000] -> 28[4000] via P2P/IPC comm 0x2ad4b8000ab0 nRanks 96 e08r2n15:22023:23011 [1] NCCL INFO Channel 01 : 29[26000] -> 28[4000] via P2P/IPC comm 0x2ad4b8000ab0 nRanks 96 e08r2n15:22024:23016 [2] NCCL INFO Connected all trees comm 0x2b123c000ab0 nRanks 96 busId 43000 e08r2n15:22024:23016 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n15:22024:23016 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n07:4889:5932 [0] NCCL INFO Channel 00/0 : 76[4000] -> 72[4000] [send] via NET/IB/0 comm 0x2aed78000ab0 nRanks 96 e08r2n08:5136:6335 [0] NCCL INFO Channel 01/0 : 4[4000] -> 0[4000] [receive] via NET/IB/0 comm 0x2b2e44000ab0 nRanks 96 e08r2n16:13442:14572 [0] NCCL INFO Channel 00/0 : 48[4000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4aa4000ab0 nRanks 96 e08r2n14:18192:19156 [0] NCCL INFO Channel 00/0 : 28[4000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b88b4000ab0 nRanks 96 e08r3n04:16936:17745 [0] NCCL INFO Channel 00/0 : 80[4000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b3574000ab0 nRanks 96 e08r2n12:8671:9661 [0] NCCL INFO Channel 01/0 : 20[4000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b66f4000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO Channel 00/0 : 73[26000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b85d4000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 01/0 : 28[4000] -> 12[4000] [send] via NET/IB/0 comm 0x2b5d18000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 01/0 : 60[4000] -> 44[4000] [send] via NET/IB/0 comm 0x2b4504000ab0 nRanks 96 e08r3n11:29645:30741 [0] NCCL INFO Channel 00/0 : 92[4000] -> 88[4000] [send] via NET/IB/0 comm 0x2ac238000ab0 nRanks 96 e08r3n07:4889:5932 [0] NCCL INFO Connected all trees comm 0x2aed78000ab0 nRanks 96 busId 4000 e08r3n07:4889:5932 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n07:4889:5932 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n07:4891:5944 [1] NCCL INFO Connected all trees comm 0x2b7a94000ab0 nRanks 96 busId 26000 e08r3n07:4891:5944 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n07:4891:5944 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n06:22283:23339 [1] NCCL INFO Channel 00 : 73[26000] -> 72[4000] via P2P/IPC comm 0x2b9a88000ab0 nRanks 96 e08r3n06:22283:23339 [1] NCCL INFO Channel 01 : 73[26000] -> 72[4000] via P2P/IPC comm 0x2b9a88000ab0 nRanks 96 e08r3n06:22284:23338 [2] NCCL INFO Connected all trees comm 0x2b141c000ab0 nRanks 96 busId 43000 e08r3n06:22284:23338 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22284:23338 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n12:8671:9661 [0] NCCL INFO Connected all trees comm 0x2b66f4000ab0 nRanks 96 busId 4000 e08r2n12:8671:9661 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n12:8671:9661 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n12:8673:9656 [1] NCCL INFO Connected all trees comm 0x2b92b8000ab0 nRanks 96 busId 26000 e08r2n12:8673:9656 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n12:8673:9656 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14532:15473 [0] NCCL INFO Channel 00/0 : 56[4000] -> 48[4000] [receive] via NET/IB/0 comm 0x2abe48000ab0 nRanks 96 e08r3n08:13434:14586 [0] NCCL INFO Channel 00/0 : 88[4000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abcf4000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Channel 01/0 : 72[4000] -> 69[26000] [send] via NET/IB/0 comm 0x2af9e0000ab0 nRanks 96 e08r2n16:13442:14572 [0] NCCL INFO Channel 01/0 : 36[4000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4aa4000ab0 nRanks 96 e08r3n04:16936:17745 [0] NCCL INFO Channel 01/0 : 68[4000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b3574000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Channel 00/0 : 28[4000] -> 24[4000] [send] via NET/IB/0 comm 0x2b5d18000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO Channel 01/0 : 68[4000] -> 64[4000] [send] via NET/IB/0 comm 0x2b85d4000ab0 nRanks 96 e08r3n03:22735:23820 [0] NCCL INFO Channel 00/0 : 60[4000] -> 56[4000] [send] via NET/IB/0 comm 0x2b4504000ab0 nRanks 96 e08r2n11:5730:6763 [0] NCCL INFO Channel 01/0 : 12[4000] -> 4[4000] [send] via NET/IB/0 comm 0x2b7a5c000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Channel 01/0 : 44[4000] -> 36[4000] [send] via NET/IB/0 comm 0x2ab408000ab0 nRanks 96 e08r3n06:22281:23330 [0] NCCL INFO Connected all trees comm 0x2af9e0000ab0 nRanks 96 busId 4000 e08r3n06:22281:23330 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22281:23330 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n06:22283:23339 [1] NCCL INFO Connected all trees comm 0x2b9a88000ab0 nRanks 96 busId 26000 e08r3n06:22283:23339 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22283:23339 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n05:24733:25802 [1] NCCL INFO Channel 00 : 69[26000] -> 68[4000] via P2P/IPC comm 0x2ab9d4000ab0 nRanks 96 e08r3n05:24733:25802 [1] NCCL INFO Channel 01 : 69[26000] -> 68[4000] via P2P/IPC comm 0x2ab9d4000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO Connected all trees comm 0x2b5d18000ab0 nRanks 96 busId 4000 e08r2n15:22021:22997 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n15:22021:22997 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n15:22023:23011 [1] NCCL INFO Connected all trees comm 0x2ad4b8000ab0 nRanks 96 busId 26000 e08r2n15:22023:23011 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n15:22023:23011 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n05:24731:25791 [0] NCCL INFO Connected all trees comm 0x2b85d4000ab0 nRanks 96 busId 4000 e08r3n05:24731:25791 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n05:24731:25791 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n05:24734:25804 [2] NCCL INFO Connected all trees comm 0x2b26b0000ab0 nRanks 96 busId 43000 e08r3n05:24733:25802 [1] NCCL INFO Connected all trees comm 0x2ab9d4000ab0 nRanks 96 busId 26000 e08r3n05:24734:25804 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n05:24734:25804 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n05:24733:25802 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n05:24733:25802 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n04:16936:17745 [0] NCCL INFO Connected all trees comm 0x2b3574000ab0 nRanks 96 busId 4000 e08r3n04:16936:17745 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n04:16936:17745 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n04:16938:17748 [1] NCCL INFO Connected all trees comm 0x2b0b78000ab0 nRanks 96 busId 26000 e08r3n04:16938:17748 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n04:16938:17748 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30401:31205 [0] NCCL INFO Channel 00/0 : 60[4000] -> 56[4000] [receive] via NET/IB/0 comm 0x2bab5c000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 00/0 : 92[4000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af008000ab0 nRanks 96 e08r3n00:14532:15473 [0] NCCL INFO Channel 01/0 : 52[4000] -> 48[4000] [receive] via NET/IB/0 comm 0x2abe48000ab0 nRanks 96 e08r3n08:13434:14586 [0] NCCL INFO Channel 01/0 : 84[4000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abcf4000ab0 nRanks 96 e08r2n14:18192:19156 [0] NCCL INFO Channel 01/0 : 24[4000] -> 21[26000] [send] via NET/IB/0 comm 0x2b88b4000ab0 nRanks 96 e08r2n11:5730:6763 [0] NCCL INFO Channel 00/0 : 12[4000] -> 8[4000] [send] via NET/IB/0 comm 0x2b7a5c000ab0 nRanks 96 e08r3n07:4891:5944 [1] NCCL INFO comm 0x2b7a94000ab0 rank 77 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n19:9030:10143 [0] NCCL INFO Channel 00/0 : 44[4000] -> 40[4000] [send] via NET/IB/0 comm 0x2ab408000ab0 nRanks 96 e08r2n09:27002:27953 [0] NCCL INFO Channel 00/0 : 9[26000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0d1c000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Channel 00/0 : 41[26000] -> 36[4000] [receive] via NET/IB/0 comm 0x2aff88000ab0 nRanks 96 e08r2n12:8674:9663 [2] NCCL INFO comm 0x2b65a0000ab0 rank 18 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n12:8671:9661 [0] NCCL INFO comm 0x2b66f4000ab0 rank 16 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n12:8675:9665 [3] NCCL INFO comm 0x2b2e18000ab0 rank 19 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n12:8673:9656 [1] NCCL INFO comm 0x2b92b8000ab0 rank 17 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n07:4889:5932 [0] NCCL INFO comm 0x2aed78000ab0 rank 76 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n07:4893:5961 [3] NCCL INFO comm 0x2ba69c000ab0 rank 79 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n07:4892:5963 [2] NCCL INFO comm 0x2b9670000ab0 rank 78 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n03:22735:23820 [0] NCCL INFO Connected all trees comm 0x2b4504000ab0 nRanks 96 busId 4000 e08r3n03:22735:23820 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n03:22735:23820 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n03:22737:23845 [1] NCCL INFO Connected all trees comm 0x2ac6a0000ab0 nRanks 96 busId 26000 e08r3n03:22737:23845 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n03:22737:23845 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n11:29645:30741 [0] NCCL INFO Connected all trees comm 0x2ac238000ab0 nRanks 96 busId 4000 e08r3n11:29645:30741 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n11:29645:30741 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n11:29647:30751 [1] NCCL INFO Connected all trees comm 0x2abd10000ab0 nRanks 96 busId 26000 e08r3n11:29647:30751 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n11:29647:30751 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5730:6763 [0] NCCL INFO Connected all trees comm 0x2b7a5c000ab0 nRanks 96 busId 4000 e08r2n11:5730:6763 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5730:6763 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n14:18192:19156 [0] NCCL INFO Connected all trees comm 0x2b88b4000ab0 nRanks 96 busId 4000 e08r2n14:18192:19156 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n14:18192:19156 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14532:15473 [0] NCCL INFO Connected all trees comm 0x2abe48000ab0 nRanks 96 busId 4000 e08r3n00:14532:15473 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5732:6769 [1] NCCL INFO Connected all trees comm 0x2b11a0000ab0 nRanks 96 busId 26000 e08r3n00:14532:15473 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5732:6769 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5732:6769 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n14:18194:19155 [1] NCCL INFO Connected all trees comm 0x2b43b4000ab0 nRanks 96 busId 26000 e08r2n14:18194:19155 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n14:18194:19155 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14534:15491 [1] NCCL INFO Connected all trees comm 0x2b8bd0000ab0 nRanks 96 busId 26000 e08r3n00:14534:15491 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n00:14534:15491 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n08:13434:14586 [0] NCCL INFO Connected all trees comm 0x2abcf4000ab0 nRanks 96 busId 4000 e08r3n08:13434:14586 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n08:13434:14586 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n08:13436:14594 [1] NCCL INFO Connected all trees comm 0x2b1954000ab0 nRanks 96 busId 26000 e08r3n08:13436:14594 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n08:13436:14594 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23993:25161 [1] NCCL INFO Channel 00 : 21[26000] -> 20[4000] via P2P/IPC comm 0x2b4058000ab0 nRanks 96 e08r2n19:9030:10143 [0] NCCL INFO Connected all trees comm 0x2ab408000ab0 nRanks 96 busId 4000 e08r2n19:9030:10143 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n19:9030:10143 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23993:25161 [1] NCCL INFO Channel 01 : 21[26000] -> 20[4000] via P2P/IPC comm 0x2b4058000ab0 nRanks 96 e08r2n19:9032:10150 [1] NCCL INFO Connected all trees comm 0x2af5f8000ab0 nRanks 96 busId 26000 e08r2n19:9032:10150 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n19:9032:10150 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n10:874:1920 [1] NCCL INFO Channel 00 : 9[26000] -> 8[4000] via P2P/IPC comm 0x2b1f10000ab0 nRanks 96 e08r2n10:874:1920 [1] NCCL INFO Channel 01 : 9[26000] -> 8[4000] via P2P/IPC comm 0x2b1f10000ab0 nRanks 96 e08r2n13:23991:25150 [0] NCCL INFO Connected all trees comm 0x2b5014000ab0 nRanks 96 busId 4000 e08r2n13:23991:25150 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n13:23991:25150 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23994:25164 [2] NCCL INFO Connected all trees comm 0x2b5d8c000ab0 nRanks 96 busId 43000 e08r2n13:23993:25161 [1] NCCL INFO Connected all trees comm 0x2b4058000ab0 nRanks 96 busId 26000 e08r2n13:23993:25161 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n13:23994:25164 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n13:23994:25164 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23993:25161 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n10:875:1919 [2] NCCL INFO Connected all trees comm 0x2af8c4000ab0 nRanks 96 busId 43000 e08r2n10:875:1919 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n10:875:1919 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n18:753:1883 [1] NCCL INFO Channel 00 : 41[26000] -> 40[4000] via P2P/IPC comm 0x2b30f4000ab0 nRanks 96 e08r2n18:753:1883 [1] NCCL INFO Channel 01 : 41[26000] -> 40[4000] via P2P/IPC comm 0x2b30f4000ab0 nRanks 96 e08r2n18:754:1880 [2] NCCL INFO Connected all trees comm 0x2b2a28000ab0 nRanks 96 busId 43000 e08r2n18:754:1880 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n18:754:1880 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30401:31205 [0] NCCL INFO Channel 01/0 : 56[4000] -> 53[26000] [send] via NET/IB/0 comm 0x2bab5c000ab0 nRanks 96 e08r3n10:18784:19834 [0] NCCL INFO Channel 01/0 : 88[4000] -> 85[26000] [send] via NET/IB/0 comm 0x2af008000ab0 nRanks 96 e08r3n06:22284:23338 [2] NCCL INFO comm 0x2b141c000ab0 rank 74 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n06:22281:23330 [0] NCCL INFO comm 0x2af9e0000ab0 rank 72 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n10:872:1911 [0] NCCL INFO Channel 01/0 : 8[4000] -> 5[26000] [send] via NET/IB/0 comm 0x2b6040000ab0 nRanks 96 e08r2n15:22021:22997 [0] NCCL INFO comm 0x2b5d18000ab0 rank 28 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n15:22024:23016 [2] NCCL INFO comm 0x2b123c000ab0 rank 30 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n15:22025:23017 [3] NCCL INFO comm 0x2b3208000ab0 rank 31 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n18:751:1877 [0] NCCL INFO Channel 01/0 : 40[4000] -> 37[26000] [send] via NET/IB/0 comm 0x2b8134000ab0 nRanks 96 e08r3n05:24733:25802 [1] NCCL INFO comm 0x2ab9d4000ab0 rank 69 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n05:24735:25797 [3] NCCL INFO comm 0x2ac218000ab0 rank 71 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n09:27002:27953 [0] NCCL INFO Channel 01/0 : 4[4000] -> 0[4000] [send] via NET/IB/0 comm 0x2b0d1c000ab0 nRanks 96 e08r3n05:24731:25791 [0] NCCL INFO comm 0x2b85d4000ab0 rank 68 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n05:24734:25804 [2] NCCL INFO comm 0x2b26b0000ab0 rank 70 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n04:16936:17745 [0] NCCL INFO comm 0x2b3574000ab0 rank 64 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n04:16939:17749 [2] NCCL INFO comm 0x2b4eb4000ab0 rank 66 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n17:21280:22441 [0] NCCL INFO Channel 01/0 : 36[4000] -> 32[4000] [send] via NET/IB/0 comm 0x2aff88000ab0 nRanks 96 e08r3n04:16940:17743 [3] NCCL INFO comm 0x2b1e28000ab0 rank 67 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n04:16938:17748 [1] NCCL INFO comm 0x2b0b78000ab0 rank 65 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n06:22285:23335 [3] NCCL INFO comm 0x2b91b4000ab0 rank 75 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n06:22283:23339 [1] NCCL INFO comm 0x2b9a88000ab0 rank 73 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n15:22023:23011 [1] NCCL INFO comm 0x2ad4b8000ab0 rank 29 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n02:30401:31205 [0] NCCL INFO Connected all trees comm 0x2bab5c000ab0 nRanks 96 busId 4000 e08r3n02:30401:31205 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n02:30401:31205 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30403:31209 [1] NCCL INFO Connected all trees comm 0x2ba198000ab0 nRanks 96 busId 26000 e08r3n02:30403:31209 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n02:30403:31209 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n10:18784:19834 [0] NCCL INFO Connected all trees comm 0x2af008000ab0 nRanks 96 busId 4000 e08r3n10:18784:19834 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n10:18784:19834 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n10:18786:19830 [1] NCCL INFO Connected all trees comm 0x2ac35c000ab0 nRanks 96 busId 26000 e08r3n10:18786:19830 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n10:18786:19830 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n01:6277:7260 [1] NCCL INFO Channel 00 : 53[26000] -> 52[4000] via P2P/IPC comm 0x2ba34c000ab0 nRanks 96 e08r3n01:6277:7260 [1] NCCL INFO Channel 01 : 53[26000] -> 52[4000] via P2P/IPC comm 0x2ba34c000ab0 nRanks 96 e08r3n09:8677:9721 [1] NCCL INFO Channel 00 : 85[26000] -> 84[4000] via P2P/IPC comm 0x2b4344000ab0 nRanks 96 e08r3n09:8677:9721 [1] NCCL INFO Channel 01 : 85[26000] -> 84[4000] via P2P/IPC comm 0x2b4344000ab0 nRanks 96 e08r3n01:6275:7256 [0] NCCL INFO Connected all trees comm 0x2b8738000ab0 nRanks 96 busId 4000 e08r3n01:6275:7256 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n01:6275:7256 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n01:6278:7261 [2] NCCL INFO Connected all trees comm 0x2b101c000ab0 nRanks 96 busId 43000 e08r3n01:6277:7260 [1] NCCL INFO Connected all trees comm 0x2ba34c000ab0 nRanks 96 busId 26000 e08r3n01:6278:7261 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n01:6278:7261 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n01:6277:7260 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n01:6277:7260 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8675:9723 [0] NCCL INFO Connected all trees comm 0x2b416c000ab0 nRanks 96 busId 4000 e08r3n09:8675:9723 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n09:8675:9723 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8677:9721 [1] NCCL INFO Connected all trees comm 0x2b4344000ab0 nRanks 96 busId 26000 e08r3n09:8677:9721 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n09:8678:9738 [2] NCCL INFO Connected all trees comm 0x2b20f8000ab0 nRanks 96 busId 43000 e08r3n09:8677:9721 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8678:9738 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n09:8678:9738 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n10:872:1911 [0] NCCL INFO Connected all trees comm 0x2b6040000ab0 nRanks 96 busId 4000 e08r2n10:872:1911 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n10:872:1911 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n10:874:1920 [1] NCCL INFO Connected all trees comm 0x2b1f10000ab0 nRanks 96 busId 26000 e08r2n10:874:1920 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n10:874:1920 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27004:27956 [1] NCCL INFO Channel 00 : 5[26000] -> 4[4000] via P2P/IPC comm 0x2af6e0000ab0 nRanks 96 e08r2n09:27004:27956 [1] NCCL INFO Channel 01 : 5[26000] -> 4[4000] via P2P/IPC comm 0x2af6e0000ab0 nRanks 96 e08r2n18:751:1877 [0] NCCL INFO Connected all trees comm 0x2b8134000ab0 nRanks 96 busId 4000 e08r2n18:751:1877 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n18:751:1877 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n18:753:1883 [1] NCCL INFO Connected all trees comm 0x2b30f4000ab0 nRanks 96 busId 26000 e08r2n18:753:1883 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n18:753:1883 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27002:27953 [0] NCCL INFO Connected all trees comm 0x2b0d1c000ab0 nRanks 96 busId 4000 e08r2n09:27002:27953 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n09:27002:27953 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27005:27965 [2] NCCL INFO Connected all trees comm 0x2b3e48000ab0 nRanks 96 busId 43000 e08r2n09:27004:27956 [1] NCCL INFO Connected all trees comm 0x2af6e0000ab0 nRanks 96 busId 26000 e08r2n09:27005:27965 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n17:21282:22447 [1] NCCL INFO Channel 00 : 37[26000] -> 36[4000] via P2P/IPC comm 0x2abf00000ab0 nRanks 96 e08r2n09:27004:27956 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n09:27004:27956 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27005:27965 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21282:22447 [1] NCCL INFO Channel 01 : 37[26000] -> 36[4000] via P2P/IPC comm 0x2abf00000ab0 nRanks 96 e08r2n17:21280:22441 [0] NCCL INFO Connected all trees comm 0x2aff88000ab0 nRanks 96 busId 4000 e08r2n17:21280:22441 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n17:21280:22441 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21283:22448 [2] NCCL INFO Connected all trees comm 0x2b9724000ab0 nRanks 96 busId 43000 e08r2n17:21283:22448 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n17:21282:22447 [1] NCCL INFO Connected all trees comm 0x2abf00000ab0 nRanks 96 busId 26000 e08r2n17:21283:22448 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21282:22447 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n17:21282:22447 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n08:5136:6335 [0] NCCL INFO Connected all trees comm 0x2b2e44000ab0 nRanks 96 busId 4000 e08r2n08:5136:6335 [0] NCCL INFO Using tuning table 0 with LL128 disabled e08r2n08:5136:6335 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5136:6335 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n08:5140:6524 [1] NCCL INFO Connected all trees comm 0x2b30cc000ab0 nRanks 96 busId 26000 e08r2n08:5140:6524 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5140:6524 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n16:13442:14572 [0] NCCL INFO Connected all trees comm 0x2b4aa4000ab0 nRanks 96 busId 4000 e08r2n16:13442:14572 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n16:13442:14572 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n16:13444:14576 [1] NCCL INFO Connected all trees comm 0x2b0180000ab0 nRanks 96 busId 26000 e08r2n16:13444:14576 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n16:13444:14576 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n03:22738:23847 [2] NCCL INFO comm 0x2af43c000ab0 rank 62 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n03:22735:23820 [0] NCCL INFO comm 0x2b4504000ab0 rank 60 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n03:22739:23827 [3] NCCL INFO comm 0x2b0524000ab0 rank 63 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n03:22737:23845 [1] NCCL INFO comm 0x2ac6a0000ab0 rank 61 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n11:29645:30741 [0] NCCL INFO comm 0x2ac238000ab0 rank 92 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n11:29647:30751 [1] NCCL INFO comm 0x2abd10000ab0 rank 93 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n11:5730:6763 [0] NCCL INFO comm 0x2b7a5c000ab0 rank 12 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n00:14535:15492 [2] NCCL INFO comm 0x2baf68000ab0 rank 50 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n00:14532:15473 [0] NCCL INFO comm 0x2abe48000ab0 rank 48 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n11:5734:6772 [3] NCCL INFO comm 0x2b4144000ab0 rank 15 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n14:18192:19156 [0] NCCL INFO comm 0x2b88b4000ab0 rank 24 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n14:18195:19161 [2] NCCL INFO comm 0x2b74c4000ab0 rank 26 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n11:5732:6769 [1] NCCL INFO comm 0x2b11a0000ab0 rank 13 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n00:14536:15487 [3] NCCL INFO comm 0x2b7774000ab0 rank 51 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n14:18196:19160 [3] NCCL INFO comm 0x2ab5e8000ab0 rank 27 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n08:13437:14595 [2] NCCL INFO comm 0x2b8f38000ab0 rank 82 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n08:13434:14586 [0] NCCL INFO comm 0x2abcf4000ab0 rank 80 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n14:18194:19155 [1] NCCL INFO comm 0x2b43b4000ab0 rank 25 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n08:13438:14591 [3] NCCL INFO comm 0x2b2614000ab0 rank 83 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n08:13436:14594 [1] NCCL INFO comm 0x2b1954000ab0 rank 81 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n19:9033:10155 [2] NCCL INFO comm 0x2b03ac000ab0 rank 46 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n19:9032:10150 [1] NCCL INFO comm 0x2af5f8000ab0 rank 45 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n13:23994:25164 [2] NCCL INFO comm 0x2b5d8c000ab0 rank 22 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n11:29648:30753 [2] NCCL INFO comm 0x2b8da8000ab0 rank 94 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n11:29649:30749 [3] NCCL INFO comm 0x2ba6ec000ab0 rank 95 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n13:23995:25163 [3] NCCL INFO comm 0x2b4b08000ab0 rank 23 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n11:5733:6773 [2] NCCL INFO comm 0x2ae6f0000ab0 rank 14 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n00:14534:15491 [1] NCCL INFO comm 0x2b8bd0000ab0 rank 49 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n19:9030:10143 [0] NCCL INFO comm 0x2ab408000ab0 rank 44 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n19:9034:10156 [3] NCCL INFO comm 0x2b6940000ab0 rank 47 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n13:23991:25150 [0] NCCL INFO comm 0x2b5014000ab0 rank 20 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n13:23993:25161 [1] NCCL INFO comm 0x2b4058000ab0 rank 21 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n02:30401:31205 [0] NCCL INFO comm 0x2bab5c000ab0 rank 56 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n02:30404:31213 [2] NCCL INFO comm 0x2b67ac000ab0 rank 58 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n02:30405:31208 [3] NCCL INFO comm 0x2b6924000ab0 rank 59 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n10:18788:19808 [3] NCCL INFO comm 0x2ad848000ab0 rank 91 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n10:18786:19830 [1] NCCL INFO comm 0x2ac35c000ab0 rank 89 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n01:6277:7260 [1] NCCL INFO comm 0x2ba34c000ab0 rank 53 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n01:6279:7255 [3] NCCL INFO comm 0x2aea58000ab0 rank 55 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n01:6275:7256 [0] NCCL INFO comm 0x2b8738000ab0 rank 52 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n01:6278:7261 [2] NCCL INFO comm 0x2b101c000ab0 rank 54 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n09:8677:9721 [1] NCCL INFO comm 0x2b4344000ab0 rank 85 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n09:8679:9728 [3] NCCL INFO comm 0x2b0c4c000ab0 rank 87 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n09:8678:9738 [2] NCCL INFO comm 0x2b20f8000ab0 rank 86 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n09:8675:9723 [0] NCCL INFO comm 0x2b416c000ab0 rank 84 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n10:872:1911 [0] NCCL INFO comm 0x2b6040000ab0 rank 8 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n10:876:1918 [3] NCCL INFO comm 0x2b2d0c000ab0 rank 11 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n10:874:1920 [1] NCCL INFO comm 0x2b1f10000ab0 rank 9 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n18:751:1877 [0] NCCL INFO comm 0x2b8134000ab0 rank 40 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n18:755:1882 [3] NCCL INFO comm 0x2b7fac000ab0 rank 43 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n18:753:1883 [1] NCCL INFO comm 0x2b30f4000ab0 rank 41 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n02:30403:31209 [1] NCCL INFO comm 0x2ba198000ab0 rank 57 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n09:27004:27956 [1] NCCL INFO comm 0x2af6e0000ab0 rank 5 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n09:27002:27953 [0] NCCL INFO comm 0x2b0d1c000ab0 rank 4 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n09:27005:27965 [2] NCCL INFO comm 0x2b3e48000ab0 rank 6 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n10:18784:19834 [0] NCCL INFO comm 0x2af008000ab0 rank 88 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n10:18787:19820 [2] NCCL INFO comm 0x2ae6c4000ab0 rank 90 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n17:21284:22443 [3] NCCL INFO comm 0x2ba520000ab0 rank 39 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n17:21282:22447 [1] NCCL INFO comm 0x2abf00000ab0 rank 37 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n17:21283:22448 [2] NCCL INFO comm 0x2b9724000ab0 rank 38 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n08:5141:6541 [2] NCCL INFO comm 0x2b5bd8000ab0 rank 2 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n08:5142:6491 [3] NCCL INFO comm 0x2ad4a8000ab0 rank 3 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n08:5140:6524 [1] NCCL INFO comm 0x2b30cc000ab0 rank 1 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n08:5136:6335 [0] NCCL INFO comm 0x2b2e44000ab0 rank 0 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n16:13445:14603 [2] NCCL INFO comm 0x2b67e4000ab0 rank 34 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n16:13446:14609 [3] NCCL INFO comm 0x2abfb8000ab0 rank 35 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n10:875:1919 [2] NCCL INFO comm 0x2af8c4000ab0 rank 10 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n18:754:1880 [2] NCCL INFO comm 0x2b2a28000ab0 rank 42 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n09:27006:27966 [3] NCCL INFO comm 0x2b56e4000ab0 rank 7 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n17:21280:22441 [0] NCCL INFO comm 0x2aff88000ab0 rank 36 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n16:13442:14572 [0] NCCL INFO comm 0x2b4aa4000ab0 rank 32 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n16:13444:14576 [1] NCCL INFO comm 0x2b0180000ab0 rank 33 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE [2023-10-27 12:39:49,506] [INFO] [partition_parameters.py:454:__exit__] finished initializing model with 7.51B parameters input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 input: 写一篇关于气候变化对海洋生态的影响的文章。 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 label: 好的,以下是你要求的文章: 气候变化对海洋生态的影响 气候变化对海洋生态产生了广泛的影响。全球变暖导致海洋温度上升,这可能会对许多水生生物的生存、繁殖和迁移造成巨大的影响。另外,海洋酸化也是一个问题 Parameter Offload: Total persistent parameters: 266240 in 65 params e08r2n08:5136:8202 [0] NCCL INFO Using network IB e08r2n08:5142:8204 [3] NCCL INFO Using network IB e08r2n10:876:3570 [3] NCCL INFO Using network IB e08r2n18:753:3473 [1] NCCL INFO Using network IB e08r3n10:18788:21518 [3] NCCL INFO Using network IB e08r2n08:5141:8206 [2] NCCL INFO Using network IB e08r2n10:875:3571 [2] NCCL INFO Using network IB e08r2n18:755:3474 [3] NCCL INFO Using network IB e08r3n09:8679:11332 [3] NCCL INFO Using network IB e08r3n05:24735:27390 [3] NCCL INFO Using network IB e08r3n11:29649:32285 [3] NCCL INFO Using network IB e08r2n19:9034:11808 [3] NCCL INFO Using network IB e08r3n00:14536:16697 [3] NCCL INFO Using network IB e08r2n18:754:3475 [2] NCCL INFO Using network IB e08r3n09:8678:11333 [2] NCCL INFO Using network IB e08r3n05:24734:27392 [2] NCCL INFO Using network IB e08r3n11:29648:32286 [2] NCCL INFO Using network IB e08r3n00:14535:16698 [2] NCCL INFO Using network IB e08r3n10:18787:21519 [2] NCCL INFO Using network IB e08r2n14:18196:20819 [3] NCCL INFO Using network IB e08r3n07:4889:7203 [0] NCCL INFO Using network IB e08r2n14:18195:20820 [2] NCCL INFO Using network IB e08r3n07:4891:7204 [1] NCCL INFO Using network IB e08r3n06:22285:25007 [3] NCCL INFO Using network IB e08r2n19:9033:11810 [2] NCCL INFO Using network IB e08r3n01:6275:8490 [0] NCCL INFO Using network IB e08r2n17:21284:23952 [3] NCCL INFO Using network IB e08r3n06:22283:25009 [1] NCCL INFO Using network IB e08r3n01:6279:8492 [3] NCCL INFO Using network IB e08r2n17:21283:23951 [2] NCCL INFO Using network IB e08r2n15:22023:24652 [1] NCCL INFO Using network IB e08r2n16:13442:16162 [0] NCCL INFO Using network IB e08r3n09:8677:11336 [1] NCCL INFO Using network IB e08r3n06:22284:25008 [2] NCCL INFO Using network IB e08r3n01:6277:8491 [1] NCCL INFO Using network IB e08r2n15:22021:24653 [0] NCCL INFO Using network IB e08r2n16:13445:16161 [2] NCCL INFO Using network IB e08r3n07:4893:7208 [3] NCCL INFO Using network IB e08r3n00:14532:16701 [0] NCCL INFO Using network IB e08r2n18:751:3479 [0] NCCL INFO Using network IB e08r2n10:874:3574 [1] NCCL INFO Using network IB e08r2n19:9032:11812 [1] NCCL INFO Using network IB e08r3n11:29647:32289 [1] NCCL INFO Using network IB e08r2n08:5140:8208 [1] NCCL INFO Using network IB e08r3n01:6278:8493 [2] NCCL INFO Using network IB e08r2n15:22024:24654 [2] NCCL INFO Using network IB e08r2n16:13444:16165 [1] NCCL INFO Using network IB e08r3n07:4892:7207 [2] NCCL INFO Using network IB e08r3n00:14534:16703 [1] NCCL INFO Using network IB e08r2n19:9030:11813 [0] NCCL INFO Using network IB e08r3n11:29645:32290 [0] NCCL INFO Using network IB e08r2n11:5733:8341 [2] NCCL INFO Using network IB e08r2n15:22025:24655 [3] NCCL INFO Using network IB e08r2n16:13446:16166 [3] NCCL INFO Using network IB e08r2n11:5730:8342 [0] NCCL INFO Using network IB e08r3n04:16940:19060 [3] NCCL INFO Using network IB e08r3n02:30405:32517 [3] NCCL INFO Using network IB e08r3n09:8675:11338 [0] NCCL INFO Using network IB e08r2n10:872:3576 [0] NCCL INFO Using network IB e08r2n14:18194:20823 [1] NCCL INFO Using network IB e08r3n04:16938:19062 [1] NCCL INFO Using network IB e08r3n02:30404:32518 [2] NCCL INFO Using network IB e08r3n10:18784:21522 [0] NCCL INFO Using network IB e08r3n03:22737:25417 [1] NCCL INFO Using network IB e08r2n09:27002:29647 [0] NCCL INFO Using network IB e08r3n10:18786:21523 [1] NCCL INFO Using network IB e08r3n03:22738:25418 [2] NCCL INFO Using network IB e08r2n09:27004:29648 [1] NCCL INFO Using network IB e08r2n13:23991:26733 [0] NCCL INFO Using network IB e08r2n12:8675:11360 [3] NCCL INFO Using network IB e08r2n09:27006:29649 [3] NCCL INFO Using network IB e08r2n13:23993:26732 [1] NCCL INFO Using network IB e08r2n09:27005:29650 [2] NCCL INFO Using network IB e08r2n13:23994:26734 [2] NCCL INFO Using network IB e08r2n13:23995:26735 [3] NCCL INFO Using network IB e08r3n03:22739:25421 [3] NCCL INFO Using network IB e08r2n14:18192:20826 [0] NCCL INFO Using network IB e08r3n06:22281:25013 [0] NCCL INFO Using network IB e08r2n11:5734:8345 [3] NCCL INFO Using network IB e08r2n17:21282:23955 [1] NCCL INFO Using network IB e08r2n11:5732:8346 [1] NCCL INFO Using network IB e08r3n08:13436:16169 [1] NCCL INFO Using network IB e08r3n05:24733:27396 [1] NCCL INFO Using network IB e08r3n04:16939:19064 [2] NCCL INFO Using network IB e08r3n05:24731:27398 [0] NCCL INFO Using network IB e08r3n03:22735:25423 [0] NCCL INFO Using network IB e08r3n08:13437:16171 [2] NCCL INFO Using network IB e08r2n12:8673:11362 [1] NCCL INFO Using network IB e08r3n04:16936:19068 [0] NCCL INFO Using network IB e08r3n08:13438:16173 [3] NCCL INFO Using network IB e08r2n12:8674:11365 [2] NCCL INFO Using network IB e08r2n17:21280:23959 [0] NCCL INFO Using network IB e08r2n12:8671:11366 [0] NCCL INFO Using network IB e08r3n02:30403:32523 [1] NCCL INFO Using network IB e08r3n02:30401:32525 [0] NCCL INFO Using network IB e08r3n08:13434:16175 [0] NCCL INFO Using network IB e08r3n03:22737:25417 [1] NCCL INFO Setting affinity for GPU 0 to ff00 e08r3n02:30403:32523 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n11:29647:32289 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n08:13436:16169 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n04:16936:19068 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n00:14536:16697 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n07:4891:7204 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n02:30405:32517 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n02:30404:32518 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n10:18788:21518 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n00:14535:16698 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n08:5142:8204 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n03:22739:25421 [3] NCCL INFO Setting affinity for GPU 0 to ff000000 e08r3n04:16939:19064 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n05:24731:27398 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n03:22738:25418 [2] NCCL INFO Setting affinity for GPU 0 to ff0000 e08r3n04:16940:19060 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n17:21284:23952 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n08:13437:16171 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n08:5136:8202 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n08:13438:16173 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n09:27006:29649 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n18:755:3474 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n06:22283:25009 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n05:24734:27392 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n05:24735:27390 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n01:6278:8493 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n09:8677:11336 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n17:21282:23955 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n10:875:3571 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n17:21283:23951 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n03:22735:25423 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n10:876:3570 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n07:4893:7208 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n19:9030:11813 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n18:754:3475 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n07:4892:7207 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n01:6279:8492 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n02:30401:32525 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n09:8675:11338 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n08:5141:8206 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n10:18786:21523 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n10:18784:21522 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n01:6277:8491 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n11:5733:8341 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n01:6275:8490 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n11:5732:8346 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n06:22281:25013 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n04:16938:19062 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n18:751:3479 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n00:14532:16701 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n18:753:3473 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n00:14534:16703 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n12:8673:11362 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n09:8679:11332 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n19:9032:11812 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n06:22285:25007 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n12:8675:11360 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n09:8678:11333 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n06:22284:25008 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n08:13434:16175 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n16:13446:16166 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n08:5140:8208 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n05:24733:27396 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n09:27004:29648 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r3n10:18787:21519 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n12:8674:11365 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n19:9033:11810 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r3n07:4889:7203 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n12:8671:11366 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n19:9034:11808 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n13:23995:26735 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r3n11:29649:32285 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n16:13445:16161 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n09:27005:29650 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n13:23991:26733 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n09:27002:29647 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n15:22021:24653 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n17:21280:23959 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n13:23994:26734 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n15:22025:24655 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n14:18195:20820 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n16:13442:16162 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n13:23993:26732 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n15:22024:24654 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n14:18196:20819 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n16:13444:16165 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n15:22023:24652 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n14:18192:20826 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n14:18194:20823 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n10:874:3574 [1] NCCL INFO Setting affinity for GPU 1 to ff00 e08r2n10:872:3576 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n11:29645:32290 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r3n11:29648:32286 [2] NCCL INFO Setting affinity for GPU 2 to ff0000 e08r2n11:5730:8342 [0] NCCL INFO Setting affinity for GPU 0 to ff e08r2n11:5734:8345 [3] NCCL INFO Setting affinity for GPU 3 to ff000000 e08r2n18:754:3475 [2] NCCL INFO Trees [0] 43/-1/-1->42->41 [1] 43/-1/-1->42->41 comm 0x2b2c8c000ab0 nRanks 96 busId 43000 e08r2n16:13446:16166 [3] NCCL INFO Trees [0] -1/-1/-1->35->34 [1] -1/-1/-1->35->34 comm 0x2ac21c000ab0 nRanks 96 busId 63000 e08r2n18:755:3474 [3] NCCL INFO Trees [0] -1/-1/-1->43->42 [1] -1/-1/-1->43->42 comm 0x2b8210000ab0 nRanks 96 busId 63000 e08r2n16:13445:16161 [2] NCCL INFO Trees [0] 35/-1/-1->34->33 [1] 35/-1/-1->34->33 comm 0x2b6a48000ab0 nRanks 96 busId 43000 e08r2n18:753:3473 [1] NCCL INFO Trees [0] 42/36/-1->41->40 [1] 42/-1/-1->41->40 comm 0x2b3358000ab0 nRanks 96 busId 26000 e08r2n18:751:3479 [0] NCCL INFO Trees [0] 41/44/-1->40->49 [1] 41/-1/-1->40->37 comm 0x2b8398000ab0 nRanks 96 busId 4000 e08r2n16:13444:16165 [1] NCCL INFO Trees [0] 34/16/-1->33->32 [1] 34/-1/-1->33->32 comm 0x2b03e8000ab0 nRanks 96 busId 26000 e08r2n15:22025:24655 [3] NCCL INFO Trees [0] -1/-1/-1->31->30 [1] -1/-1/-1->31->30 comm 0x2b3468000ab0 nRanks 96 busId 63000 e08r2n14:18195:20820 [2] NCCL INFO Trees [0] 27/-1/-1->26->25 [1] 27/-1/-1->26->25 comm 0x2b7728000ab0 nRanks 96 busId 43000 e08r2n16:13442:16162 [0] NCCL INFO Trees [0] 33/48/-1->32->65 [1] 33/-1/-1->32->36 comm 0x2b4c88000ab0 nRanks 96 busId 4000 e08r2n14:18196:20819 [3] NCCL INFO Trees [0] -1/-1/-1->27->26 [1] -1/-1/-1->27->26 comm 0x2ab848000ab0 nRanks 96 busId 63000 e08r2n17:21284:23952 [3] NCCL INFO Trees [0] -1/-1/-1->39->38 [1] -1/-1/-1->39->38 comm 0x2ba784000ab0 nRanks 96 busId 63000 e08r2n14:18194:20823 [1] NCCL INFO Trees [0] 26/20/-1->25->24 [1] 26/-1/-1->25->24 comm 0x2b4618000ab0 nRanks 96 busId 26000 e08r2n17:21283:23951 [2] NCCL INFO Trees [0] 39/-1/-1->38->37 [1] 39/-1/-1->38->37 comm 0x2b9988000ab0 nRanks 96 busId 43000 e08r2n19:9030:11813 [0] NCCL INFO Trees [0] 45/-1/-1->44->40 [1] 45/36/-1->44->60 comm 0x2ab5e8000ab0 nRanks 96 busId 4000 e08r2n15:22024:24654 [2] NCCL INFO Trees [0] 31/-1/-1->30->29 [1] 31/-1/-1->30->29 comm 0x2b14a0000ab0 nRanks 96 busId 43000 e08r2n13:23995:26735 [3] NCCL INFO Trees [0] -1/-1/-1->23->22 [1] -1/-1/-1->23->22 comm 0x2b4d6c000ab0 nRanks 96 busId 63000 e08r2n14:18192:20826 [0] NCCL INFO Trees [0] 25/28/-1->24->16 [1] 25/-1/-1->24->21 comm 0x2b8b18000ab0 nRanks 96 busId 4000 e08r2n17:21280:23959 [0] NCCL INFO Trees [0] 37/-1/-1->36->41 [1] 37/32/-1->36->44 comm 0x2b01f0000ab0 nRanks 96 busId 4000 e08r2n19:9032:11812 [1] NCCL INFO Trees [0] 46/-1/-1->45->44 [1] 46/52/-1->45->44 comm 0x2af85c000ab0 nRanks 96 busId 26000 e08r2n15:22021:24653 [0] NCCL INFO Trees [0] 29/-1/-1->28->24 [1] 29/12/-1->28->92 comm 0x2b5f80000ab0 nRanks 96 busId 4000 e08r2n13:23994:26734 [2] NCCL INFO Trees [0] 23/-1/-1->22->21 [1] 23/-1/-1->22->21 comm 0x2b5ff4000ab0 nRanks 96 busId 43000 e08r2n17:21282:23955 [1] NCCL INFO Trees [0] 38/-1/-1->37->36 [1] 38/40/-1->37->36 comm 0x2ac164000ab0 nRanks 96 busId 26000 e08r2n19:9034:11808 [3] NCCL INFO Trees [0] -1/-1/-1->47->46 [1] -1/-1/-1->47->46 comm 0x2b6ba4000ab0 nRanks 96 busId 63000 e08r2n15:22023:24652 [1] NCCL INFO Trees [0] 30/-1/-1->29->28 [1] 30/60/-1->29->28 comm 0x2ad720000ab0 nRanks 96 busId 26000 e08r2n13:23993:26732 [1] NCCL INFO Trees [0] 22/-1/-1->21->20 [1] 22/24/-1->21->20 comm 0x2b42c0000ab0 nRanks 96 busId 26000 e08r3n00:14534:16703 [1] NCCL INFO Trees [0] 50/40/-1->49->48 [1] 50/-1/-1->49->48 comm 0x2b8e34000ab0 nRanks 96 busId 26000 e08r2n19:9033:11810 [2] NCCL INFO Trees [0] 47/-1/-1->46->45 [1] 47/-1/-1->46->45 comm 0x2b0610000ab0 nRanks 96 busId 43000 e08r2n13:23991:26733 [0] NCCL INFO Trees [0] 21/-1/-1->20->25 [1] 21/16/-1->20->13 comm 0x2b51f4000ab0 nRanks 96 busId 4000 e08r3n00:14532:16701 [0] NCCL INFO Trees [0] 49/56/-1->48->32 [1] 49/-1/-1->48->52 comm 0x2ac0ac000ab0 nRanks 96 busId 4000 e08r2n11:5734:8345 [3] NCCL INFO Trees [0] -1/-1/-1->15->14 [1] -1/-1/-1->15->14 comm 0x2b4320000ab0 nRanks 96 busId 63000 e08r2n12:8673:11362 [1] NCCL INFO Trees [0] 18/8/-1->17->16 [1] 18/-1/-1->17->16 comm 0x2b951c000ab0 nRanks 96 busId 26000 e08r3n00:14536:16697 [3] NCCL INFO Trees [0] -1/-1/-1->51->50 [1] -1/-1/-1->51->50 comm 0x2b79d4000ab0 nRanks 96 busId 63000 e08r2n11:5733:8341 [2] NCCL INFO Trees [0] 15/-1/-1->14->13 [1] 15/-1/-1->14->13 comm 0x2ae954000ab0 nRanks 96 busId 43000 e08r2n12:8674:11365 [2] NCCL INFO Trees [0] 19/-1/-1->18->17 [1] 19/-1/-1->18->17 comm 0x2b6804000ab0 nRanks 96 busId 43000 e08r3n00:14535:16698 [2] NCCL INFO Trees [0] 51/-1/-1->50->49 [1] 51/-1/-1->50->49 comm 0x2bb1cc000ab0 nRanks 96 busId 43000 e08r2n12:8675:11360 [3] NCCL INFO Trees [0] -1/-1/-1->19->18 [1] -1/-1/-1->19->18 comm 0x2b3078000ab0 nRanks 96 busId 63000 e08r2n12:8671:11366 [0] NCCL INFO Trees [0] 17/24/-1->16->33 [1] 17/-1/-1->16->20 comm 0x2b6958000ab0 nRanks 96 busId 4000 e08r3n05:24735:27390 [3] NCCL INFO Trees [0] -1/-1/-1->71->70 [1] -1/-1/-1->71->70 comm 0x2ac47c000ab0 nRanks 96 busId 63000 e08r3n01:6277:8491 [1] NCCL INFO Trees [0] 54/-1/-1->53->52 [1] 54/56/-1->53->52 comm 0x2ba5b0000ab0 nRanks 96 busId 26000 e08r3n01:6275:8490 [0] NCCL INFO Trees [0] 53/-1/-1->52->57 [1] 53/48/-1->52->45 comm 0x2b899c000ab0 nRanks 96 busId 4000 e08r3n06:22283:25009 [1] NCCL INFO Trees [0] 74/68/-1->73->72 [1] 74/-1/-1->73->72 comm 0x2b9cec000ab0 nRanks 96 busId 26000 e08r3n01:6278:8493 [2] NCCL INFO Trees [0] 55/-1/-1->54->53 [1] 55/-1/-1->54->53 comm 0x2b1280000ab0 nRanks 96 busId 43000 e08r3n06:22285:25007 [3] NCCL INFO Trees [0] -1/-1/-1->75->74 [1] -1/-1/-1->75->74 comm 0x2b9418000ab0 nRanks 96 busId 63000 e08r3n06:22284:25008 [2] NCCL INFO Trees [0] 75/-1/-1->74->73 [1] 75/-1/-1->74->73 comm 0x2b15fc000ab0 nRanks 96 busId 43000 e08r3n06:22281:25013 [0] NCCL INFO Trees [0] 73/76/-1->72->81 [1] 73/-1/-1->72->69 comm 0x2afc48000ab0 nRanks 96 busId 4000 e08r3n01:6279:8492 [3] NCCL INFO Trees [0] -1/-1/-1->55->54 [1] -1/-1/-1->55->54 comm 0x2aecbc000ab0 nRanks 96 busId 63000 e08r3n02:30401:32525 [0] NCCL INFO Trees [0] 57/60/-1->56->48 [1] 57/-1/-1->56->53 comm 0x2badc0000ab0 nRanks 96 busId 4000 e08r3n05:24733:27396 [1] NCCL INFO Trees [0] 70/-1/-1->69->68 [1] 70/72/-1->69->68 comm 0x2abc38000ab0 nRanks 96 busId 26000 e08r3n07:4889:7203 [0] NCCL INFO Trees [0] 77/-1/-1->76->72 [1] 77/68/-1->76->61 comm 0x2aefdc000ab0 nRanks 96 busId 4000 e08r3n05:24734:27392 [2] NCCL INFO Trees [0] 71/-1/-1->70->69 [1] 71/-1/-1->70->69 comm 0x2b2914000ab0 nRanks 96 busId 43000 e08r3n07:4891:7204 [1] NCCL INFO Trees [0] 78/-1/-1->77->76 [1] 78/84/-1->77->76 comm 0x2b7cf8000ab0 nRanks 96 busId 26000 e08r3n02:30403:32523 [1] NCCL INFO Trees [0] 58/52/-1->57->56 [1] 58/-1/-1->57->56 comm 0x2ba378000ab0 nRanks 96 busId 26000 e08r3n05:24731:27398 [0] NCCL INFO Trees [0] 69/-1/-1->68->73 [1] 69/64/-1->68->76 comm 0x2b883c000ab0 nRanks 96 busId 4000 e08r3n07:4892:7207 [2] NCCL INFO Trees [0] 79/-1/-1->78->77 [1] 79/-1/-1->78->77 comm 0x2b98d4000ab0 nRanks 96 busId 43000 e08r3n02:30405:32517 [3] NCCL INFO Trees [0] -1/-1/-1->59->58 [1] -1/-1/-1->59->58 comm 0x2b6b88000ab0 nRanks 96 busId 63000 e08r3n03:22735:25423 [0] NCCL INFO Trees [0] 61/-1/-1->60->56 [1] 61/44/-1->60->29 comm 0x2b4768000ab0 nRanks 96 busId 4000 e08r2n08:5142:8204 [3] NCCL INFO Trees [0] -1/-1/-1->3->2 [1] -1/-1/-1->3->2 comm 0x2ad70c000ab0 nRanks 96 busId 63000 e08r3n07:4893:7208 [3] NCCL INFO Trees [0] -1/-1/-1->79->78 [1] -1/-1/-1->79->78 comm 0x2ba900000ab0 nRanks 96 busId 63000 e08r3n02:30404:32518 [2] NCCL INFO Trees [0] 59/-1/-1->58->57 [1] 59/-1/-1->58->57 comm 0x2b6a10000ab0 nRanks 96 busId 43000 e08r3n03:22737:25417 [1] NCCL INFO Trees [0] 62/-1/-1->61->60 [1] 62/76/-1->61->60 comm 0x2ac904000ab0 nRanks 96 busId 26000 e08r3n04:16940:19060 [3] NCCL INFO Trees [0] -1/-1/-1->67->66 [1] -1/-1/-1->67->66 comm 0x2b208c000ab0 nRanks 96 busId 63000 e08r2n10:876:3570 [3] NCCL INFO Trees [0] -1/-1/-1->11->10 [1] -1/-1/-1->11->10 comm 0x2b2f70000ab0 nRanks 96 busId 63000 e08r2n11:5730:8342 [0] NCCL INFO Trees [0] 13/-1/-1->12->8 [1] 13/4/-1->12->28 comm 0x2b7cc4000ab0 nRanks 96 busId 4000 e08r2n09:27006:29649 [3] NCCL INFO Trees [0] -1/-1/-1->7->6 [1] -1/-1/-1->7->6 comm 0x2b5948000ab0 nRanks 96 busId 63000 e08r2n08:5141:8206 [2] NCCL INFO Trees [0] 3/-1/-1->2->1 [1] 3/-1/-1->2->1 comm 0x2b5e3c000ab0 nRanks 96 busId 43000 e08r3n03:22738:25418 [2] NCCL INFO Trees [0] 63/-1/-1->62->61 [1] 63/-1/-1->62->61 comm 0x2af6a0000ab0 nRanks 96 busId 43000 e08r3n04:16939:19064 [2] NCCL INFO Trees [0] 67/-1/-1->66->65 [1] 67/-1/-1->66->65 comm 0x2b5118000ab0 nRanks 96 busId 43000 e08r2n10:872:3576 [0] NCCL INFO Trees [0] 9/12/-1->8->17 [1] 9/-1/-1->8->5 comm 0x2b62a4000ab0 nRanks 96 busId 4000 e08r2n11:5732:8346 [1] NCCL INFO Trees [0] 14/-1/-1->13->12 [1] 14/20/-1->13->12 comm 0x2b1404000ab0 nRanks 96 busId 26000 e08r2n09:27004:29648 [1] NCCL INFO Trees [0] 6/-1/-1->5->4 [1] 6/8/-1->5->4 comm 0x2af944000ab0 nRanks 96 busId 26000 e08r3n11:29649:32285 [3] NCCL INFO Trees [0] -1/-1/-1->95->94 [1] -1/-1/-1->95->94 comm 0x2ba94c000ab0 nRanks 96 busId 63000 e08r3n08:13434:16175 [0] NCCL INFO Trees [0] 81/88/-1->80->64 [1] 81/-1/-1->80->84 comm 0x2abf58000ab0 nRanks 96 busId 4000 e08r2n08:5136:8202 [0] NCCL INFO Channel 00/02 : 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 e08r2n08:5136:8202 [0] NCCL INFO Channel 01/02 : 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 e08r2n08:5136:8202 [0] NCCL INFO Trees [0] 1/64/-1->0->-1 [1] 1/-1/-1->0->4 comm 0x2b30a8000ab0 nRanks 96 busId 4000 e08r2n08:5140:8208 [1] NCCL INFO Trees [0] 2/-1/-1->1->0 [1] 2/-1/-1->1->0 comm 0x2b3330000ab0 nRanks 96 busId 26000 e08r3n03:22739:25421 [3] NCCL INFO Trees [0] -1/-1/-1->63->62 [1] -1/-1/-1->63->62 comm 0x2b0784000ab0 nRanks 96 busId 63000 e08r3n04:16938:19062 [1] NCCL INFO Trees [0] 66/32/-1->65->64 [1] 66/-1/-1->65->64 comm 0x2b0ddc000ab0 nRanks 96 busId 26000 e08r2n10:874:3574 [1] NCCL INFO Trees [0] 10/4/-1->9->8 [1] 10/-1/-1->9->8 comm 0x2b20f0000ab0 nRanks 96 busId 26000 e08r2n09:27005:29650 [2] NCCL INFO Trees [0] 7/-1/-1->6->5 [1] 7/-1/-1->6->5 comm 0x2b40ac000ab0 nRanks 96 busId 43000 e08r3n11:29648:32286 [2] NCCL INFO Trees [0] 95/-1/-1->94->93 [1] 95/-1/-1->94->93 comm 0x2b900c000ab0 nRanks 96 busId 43000 e08r3n08:13436:16169 [1] NCCL INFO Trees [0] 82/72/-1->81->80 [1] 82/-1/-1->81->80 comm 0x2b1bb8000ab0 nRanks 96 busId 26000 e08r3n09:8677:11336 [1] NCCL INFO Trees [0] 86/-1/-1->85->84 [1] 86/88/-1->85->84 comm 0x2b45a8000ab0 nRanks 96 busId 26000 e08r3n04:16936:19068 [0] NCCL INFO Trees [0] 65/80/-1->64->0 [1] 65/-1/-1->64->68 comm 0x2b37d8000ab0 nRanks 96 busId 4000 e08r2n10:875:3571 [2] NCCL INFO Trees [0] 11/-1/-1->10->9 [1] 11/-1/-1->10->9 comm 0x2afb28000ab0 nRanks 96 busId 43000 e08r2n09:27002:29647 [0] NCCL INFO Trees [0] 5/-1/-1->4->9 [1] 5/0/-1->4->12 comm 0x2b0f80000ab0 nRanks 96 busId 4000 e08r3n11:29647:32289 [1] NCCL INFO Trees [0] 94/-1/-1->93->92 [1] 94/-1/-1->93->92 comm 0x2abf74000ab0 nRanks 96 busId 26000 e08r3n08:13437:16171 [2] NCCL INFO Trees [0] 83/-1/-1->82->81 [1] 83/-1/-1->82->81 comm 0x2b919c000ab0 nRanks 96 busId 43000 e08r3n09:8678:11333 [2] NCCL INFO Trees [0] 87/-1/-1->86->85 [1] 87/-1/-1->86->85 comm 0x2b235c000ab0 nRanks 96 busId 43000 e08r3n10:18788:21518 [3] NCCL INFO Trees [0] -1/-1/-1->91->90 [1] -1/-1/-1->91->90 comm 0x2adaac000ab0 nRanks 96 busId 63000 e08r3n11:29645:32290 [0] NCCL INFO Trees [0] 93/-1/-1->92->88 [1] 93/28/-1->92->-1 comm 0x2ac49c000ab0 nRanks 96 busId 4000 e08r3n08:13438:16173 [3] NCCL INFO Trees [0] -1/-1/-1->83->82 [1] -1/-1/-1->83->82 comm 0x2b2878000ab0 nRanks 96 busId 63000 e08r3n09:8675:11338 [0] NCCL INFO Trees [0] 85/-1/-1->84->89 [1] 85/80/-1->84->77 comm 0x2b43d0000ab0 nRanks 96 busId 4000 e08r3n10:18787:21519 [2] NCCL INFO Trees [0] 91/-1/-1->90->89 [1] 91/-1/-1->90->89 comm 0x2ae928000ab0 nRanks 96 busId 43000 e08r3n09:8679:11332 [3] NCCL INFO Trees [0] -1/-1/-1->87->86 [1] -1/-1/-1->87->86 comm 0x2b0eac000ab0 nRanks 96 busId 63000 e08r3n10:18786:21523 [1] NCCL INFO Trees [0] 90/84/-1->89->88 [1] 90/-1/-1->89->88 comm 0x2ac5c0000ab0 nRanks 96 busId 26000 e08r3n10:18784:21522 [0] NCCL INFO Trees [0] 89/92/-1->88->80 [1] 89/-1/-1->88->85 comm 0x2af26c000ab0 nRanks 96 busId 4000 e08r2n17:21280:23959 [0] NCCL INFO Channel 00/0 : 35[63000] -> 36[4000] [receive] via NET/IB/0 comm 0x2b01f0000ab0 nRanks 96 e08r2n18:751:3479 [0] NCCL INFO Channel 00/0 : 39[63000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8398000ab0 nRanks 96 e08r2n16:13442:16162 [0] NCCL INFO Channel 00/0 : 31[63000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4c88000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 00/0 : 43[63000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r2n16:13445:16161 [2] NCCL INFO Channel 00 : 34[43000] -> 35[63000] via P2P/IPC comm 0x2b6a48000ab0 nRanks 96 e08r2n18:753:3473 [1] NCCL INFO Channel 00 : 41[26000] -> 42[43000] via P2P/IPC comm 0x2b3358000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 00/0 : 27[63000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5f80000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 00/0 : 23[63000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b8b18000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 00/0 : 19[63000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b51f4000ab0 nRanks 96 e08r2n18:754:3475 [2] NCCL INFO Channel 00 : 42[43000] -> 43[63000] via P2P/IPC comm 0x2b2c8c000ab0 nRanks 96 e08r2n16:13444:16165 [1] NCCL INFO Channel 00 : 33[26000] -> 34[43000] via P2P/IPC comm 0x2b03e8000ab0 nRanks 96 e08r2n16:13445:16161 [2] NCCL INFO Channel 01 : 34[43000] -> 35[63000] via P2P/IPC comm 0x2b6a48000ab0 nRanks 96 e08r2n13:23994:26734 [2] NCCL INFO Channel 00 : 22[43000] -> 23[63000] via P2P/IPC comm 0x2b5ff4000ab0 nRanks 96 e08r2n14:18195:20820 [2] NCCL INFO Channel 00 : 26[43000] -> 27[63000] via P2P/IPC comm 0x2b7728000ab0 nRanks 96 e08r2n14:18194:20823 [1] NCCL INFO Channel 00 : 25[26000] -> 26[43000] via P2P/IPC comm 0x2b4618000ab0 nRanks 96 e08r2n19:9032:11812 [1] NCCL INFO Channel 00 : 45[26000] -> 46[43000] via P2P/IPC comm 0x2af85c000ab0 nRanks 96 e08r2n15:22023:24652 [1] NCCL INFO Channel 00 : 29[26000] -> 30[43000] via P2P/IPC comm 0x2ad720000ab0 nRanks 96 e08r2n17:21283:23951 [2] NCCL INFO Channel 00 : 38[43000] -> 39[63000] via P2P/IPC comm 0x2b9988000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Channel 00/0 : 47[63000] -> 48[4000] [receive] via NET/IB/0 comm 0x2ac0ac000ab0 nRanks 96 e08r2n19:9033:11810 [2] NCCL INFO Channel 00 : 46[43000] -> 47[63000] via P2P/IPC comm 0x2b0610000ab0 nRanks 96 e08r2n15:22024:24654 [2] NCCL INFO Channel 00 : 30[43000] -> 31[63000] via P2P/IPC comm 0x2b14a0000ab0 nRanks 96 e08r2n17:21282:23955 [1] NCCL INFO Channel 00 : 37[26000] -> 38[43000] via P2P/IPC comm 0x2ac164000ab0 nRanks 96 e08r2n13:23993:26732 [1] NCCL INFO Channel 00 : 21[26000] -> 22[43000] via P2P/IPC comm 0x2b42c0000ab0 nRanks 96 e08r2n18:754:3475 [2] NCCL INFO Channel 01 : 42[43000] -> 43[63000] via P2P/IPC comm 0x2b2c8c000ab0 nRanks 96 e08r2n19:9032:11812 [1] NCCL INFO Channel 01 : 45[26000] -> 46[43000] via P2P/IPC comm 0x2af85c000ab0 nRanks 96 e08r2n13:23994:26734 [2] NCCL INFO Channel 01 : 22[43000] -> 23[63000] via P2P/IPC comm 0x2b5ff4000ab0 nRanks 96 e08r2n18:753:3473 [1] NCCL INFO Channel 01 : 41[26000] -> 42[43000] via P2P/IPC comm 0x2b3358000ab0 nRanks 96 e08r2n16:13444:16165 [1] NCCL INFO Channel 01 : 33[26000] -> 34[43000] via P2P/IPC comm 0x2b03e8000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 00/0 : 15[63000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b6958000ab0 nRanks 96 e08r2n14:18195:20820 [2] NCCL INFO Channel 01 : 26[43000] -> 27[63000] via P2P/IPC comm 0x2b7728000ab0 nRanks 96 e08r2n19:9033:11810 [2] NCCL INFO Channel 01 : 46[43000] -> 47[63000] via P2P/IPC comm 0x2b0610000ab0 nRanks 96 e08r2n13:23993:26732 [1] NCCL INFO Channel 01 : 21[26000] -> 22[43000] via P2P/IPC comm 0x2b42c0000ab0 nRanks 96 e08r2n12:8673:11362 [1] NCCL INFO Channel 00 : 17[26000] -> 18[43000] via P2P/IPC comm 0x2b951c000ab0 nRanks 96 e08r2n14:18194:20823 [1] NCCL INFO Channel 01 : 25[26000] -> 26[43000] via P2P/IPC comm 0x2b4618000ab0 nRanks 96 e08r2n11:5733:8341 [2] NCCL INFO Channel 00 : 14[43000] -> 15[63000] via P2P/IPC comm 0x2ae954000ab0 nRanks 96 e08r3n00:14535:16698 [2] NCCL INFO Channel 00 : 50[43000] -> 51[63000] via P2P/IPC comm 0x2bb1cc000ab0 nRanks 96 e08r3n02:30401:32525 [0] NCCL INFO Channel 00/0 : 55[63000] -> 56[4000] [receive] via NET/IB/0 comm 0x2badc0000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Channel 00/0 : 75[63000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aefdc000ab0 nRanks 96 e08r2n15:22024:24654 [2] NCCL INFO Channel 01 : 30[43000] -> 31[63000] via P2P/IPC comm 0x2b14a0000ab0 nRanks 96 e08r2n12:8674:11365 [2] NCCL INFO Channel 00 : 18[43000] -> 19[63000] via P2P/IPC comm 0x2b6804000ab0 nRanks 96 e08r2n11:5733:8341 [2] NCCL INFO Channel 01 : 14[43000] -> 15[63000] via P2P/IPC comm 0x2ae954000ab0 nRanks 96 e08r3n00:14534:16703 [1] NCCL INFO Channel 00 : 49[26000] -> 50[43000] via P2P/IPC comm 0x2b8e34000ab0 nRanks 96 e08r2n15:22023:24652 [1] NCCL INFO Channel 01 : 29[26000] -> 30[43000] via P2P/IPC comm 0x2ad720000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 00/0 : 51[63000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b899c000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 00/0 : 59[63000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4768000ab0 nRanks 96 e08r2n17:21282:23955 [1] NCCL INFO Channel 01 : 37[26000] -> 38[43000] via P2P/IPC comm 0x2ac164000ab0 nRanks 96 e08r3n05:24733:27396 [1] NCCL INFO Channel 00 : 69[26000] -> 70[43000] via P2P/IPC comm 0x2abc38000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 00/0 : 71[63000] -> 72[4000] [receive] via NET/IB/0 comm 0x2afc48000ab0 nRanks 96 e08r2n12:8674:11365 [2] NCCL INFO Channel 01 : 18[43000] -> 19[63000] via P2P/IPC comm 0x2b6804000ab0 nRanks 96 e08r2n11:5730:8342 [0] NCCL INFO Channel 00/0 : 11[63000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7cc4000ab0 nRanks 96 e08r3n00:14535:16698 [2] NCCL INFO Channel 01 : 50[43000] -> 51[63000] via P2P/IPC comm 0x2bb1cc000ab0 nRanks 96 e08r3n01:6277:8491 [1] NCCL INFO Channel 00 : 53[26000] -> 54[43000] via P2P/IPC comm 0x2ba5b0000ab0 nRanks 96 e08r2n17:21283:23951 [2] NCCL INFO Channel 01 : 38[43000] -> 39[63000] via P2P/IPC comm 0x2b9988000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 00/0 : 67[63000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b883c000ab0 nRanks 96 e08r3n06:22284:25008 [2] NCCL INFO Channel 00 : 74[43000] -> 75[63000] via P2P/IPC comm 0x2b15fc000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Channel 00/0 : 7[63000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b62a4000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 00/0 : 79[63000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abf58000ab0 nRanks 96 e08r3n07:4892:7207 [2] NCCL INFO Channel 00 : 78[43000] -> 79[63000] via P2P/IPC comm 0x2b98d4000ab0 nRanks 96 e08r2n08:5136:8202 [0] NCCL INFO Channel 00/0 : 95[63000] -> 0[4000] [receive] via NET/IB/0 comm 0x2b30a8000ab0 nRanks 96 e08r2n12:8673:11362 [1] NCCL INFO Channel 01 : 17[26000] -> 18[43000] via P2P/IPC comm 0x2b951c000ab0 nRanks 96 e08r3n00:14534:16703 [1] NCCL INFO Channel 01 : 49[26000] -> 50[43000] via P2P/IPC comm 0x2b8e34000ab0 nRanks 96 e08r3n01:6278:8493 [2] NCCL INFO Channel 00 : 54[43000] -> 55[63000] via P2P/IPC comm 0x2b1280000ab0 nRanks 96 e08r3n05:24734:27392 [2] NCCL INFO Channel 00 : 70[43000] -> 71[63000] via P2P/IPC comm 0x2b2914000ab0 nRanks 96 e08r3n06:22283:25009 [1] NCCL INFO Channel 00 : 73[26000] -> 74[43000] via P2P/IPC comm 0x2b9cec000ab0 nRanks 96 e08r2n10:874:3574 [1] NCCL INFO Channel 00 : 9[26000] -> 10[43000] via P2P/IPC comm 0x2b20f0000ab0 nRanks 96 e08r3n07:4891:7204 [1] NCCL INFO Channel 00 : 77[26000] -> 78[43000] via P2P/IPC comm 0x2b7cf8000ab0 nRanks 96 e08r3n03:22737:25417 [1] NCCL INFO Channel 00 : 61[26000] -> 62[43000] via P2P/IPC comm 0x2ac904000ab0 nRanks 96 e08r3n04:16936:19068 [0] NCCL INFO Channel 00/0 : 63[63000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b37d8000ab0 nRanks 96 e08r3n02:30404:32518 [2] NCCL INFO Channel 00 : 58[43000] -> 59[63000] via P2P/IPC comm 0x2b6a10000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 00/0 : 3[63000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0f80000ab0 nRanks 96 e08r3n11:29645:32290 [0] NCCL INFO Channel 00/0 : 91[63000] -> 92[4000] [receive] via NET/IB/0 comm 0x2ac49c000ab0 nRanks 96 e08r2n08:5140:8208 [1] NCCL INFO Channel 00 : 1[26000] -> 2[43000] via P2P/IPC comm 0x2b3330000ab0 nRanks 96 e08r2n08:5140:8208 [1] NCCL INFO Channel 01 : 1[26000] -> 2[43000] via P2P/IPC comm 0x2b3330000ab0 nRanks 96 e08r2n08:5141:8206 [2] NCCL INFO Channel 00 : 2[43000] -> 3[63000] via P2P/IPC comm 0x2b5e3c000ab0 nRanks 96 e08r3n01:6278:8493 [2] NCCL INFO Channel 01 : 54[43000] -> 55[63000] via P2P/IPC comm 0x2b1280000ab0 nRanks 96 e08r3n05:24733:27396 [1] NCCL INFO Channel 01 : 69[26000] -> 70[43000] via P2P/IPC comm 0x2abc38000ab0 nRanks 96 e08r3n06:22284:25008 [2] NCCL INFO Channel 01 : 74[43000] -> 75[63000] via P2P/IPC comm 0x2b15fc000ab0 nRanks 96 e08r2n10:875:3571 [2] NCCL INFO Channel 00 : 10[43000] -> 11[63000] via P2P/IPC comm 0x2afb28000ab0 nRanks 96 e08r3n07:4892:7207 [2] NCCL INFO Channel 01 : 78[43000] -> 79[63000] via P2P/IPC comm 0x2b98d4000ab0 nRanks 96 e08r3n03:22738:25418 [2] NCCL INFO Channel 00 : 62[43000] -> 63[63000] via P2P/IPC comm 0x2af6a0000ab0 nRanks 96 e08r3n04:16938:19062 [1] NCCL INFO Channel 00 : 65[26000] -> 66[43000] via P2P/IPC comm 0x2b0ddc000ab0 nRanks 96 e08r3n02:30403:32523 [1] NCCL INFO Channel 00 : 57[26000] -> 58[43000] via P2P/IPC comm 0x2ba378000ab0 nRanks 96 e08r2n09:27004:29648 [1] NCCL INFO Channel 00 : 5[26000] -> 6[43000] via P2P/IPC comm 0x2af944000ab0 nRanks 96 e08r3n11:29648:32286 [2] NCCL INFO Channel 00 : 94[43000] -> 95[63000] via P2P/IPC comm 0x2b900c000ab0 nRanks 96 e08r2n11:5732:8346 [1] NCCL INFO Channel 00 : 13[26000] -> 14[43000] via P2P/IPC comm 0x2b1404000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 00/0 : 83[63000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b43d0000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 00/0 : 87[63000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af26c000ab0 nRanks 96 e08r3n01:6277:8491 [1] NCCL INFO Channel 01 : 53[26000] -> 54[43000] via P2P/IPC comm 0x2ba5b0000ab0 nRanks 96 e08r3n05:24734:27392 [2] NCCL INFO Channel 01 : 70[43000] -> 71[63000] via P2P/IPC comm 0x2b2914000ab0 nRanks 96 e08r3n06:22283:25009 [1] NCCL INFO Channel 01 : 73[26000] -> 74[43000] via P2P/IPC comm 0x2b9cec000ab0 nRanks 96 e08r2n10:875:3571 [2] NCCL INFO Channel 01 : 10[43000] -> 11[63000] via P2P/IPC comm 0x2afb28000ab0 nRanks 96 e08r3n07:4891:7204 [1] NCCL INFO Channel 01 : 77[26000] -> 78[43000] via P2P/IPC comm 0x2b7cf8000ab0 nRanks 96 e08r3n03:22737:25417 [1] NCCL INFO Channel 01 : 61[26000] -> 62[43000] via P2P/IPC comm 0x2ac904000ab0 nRanks 96 e08r3n04:16939:19064 [2] NCCL INFO Channel 00 : 66[43000] -> 67[63000] via P2P/IPC comm 0x2b5118000ab0 nRanks 96 e08r3n02:30404:32518 [2] NCCL INFO Channel 01 : 58[43000] -> 59[63000] via P2P/IPC comm 0x2b6a10000ab0 nRanks 96 e08r2n09:27005:29650 [2] NCCL INFO Channel 00 : 6[43000] -> 7[63000] via P2P/IPC comm 0x2b40ac000ab0 nRanks 96 e08r3n11:29647:32289 [1] NCCL INFO Channel 00 : 93[26000] -> 94[43000] via P2P/IPC comm 0x2abf74000ab0 nRanks 96 e08r2n11:5732:8346 [1] NCCL INFO Channel 01 : 13[26000] -> 14[43000] via P2P/IPC comm 0x2b1404000ab0 nRanks 96 e08r3n09:8677:11336 [1] NCCL INFO Channel 00 : 85[26000] -> 86[43000] via P2P/IPC comm 0x2b45a8000ab0 nRanks 96 e08r3n10:18786:21523 [1] NCCL INFO Channel 00 : 89[26000] -> 90[43000] via P2P/IPC comm 0x2ac5c0000ab0 nRanks 96 e08r3n08:13437:16171 [2] NCCL INFO Channel 00 : 82[43000] -> 83[63000] via P2P/IPC comm 0x2b919c000ab0 nRanks 96 e08r2n08:5141:8206 [2] NCCL INFO Channel 01 : 2[43000] -> 3[63000] via P2P/IPC comm 0x2b5e3c000ab0 nRanks 96 e08r2n10:874:3574 [1] NCCL INFO Channel 01 : 9[26000] -> 10[43000] via P2P/IPC comm 0x2b20f0000ab0 nRanks 96 e08r3n03:22738:25418 [2] NCCL INFO Channel 01 : 62[43000] -> 63[63000] via P2P/IPC comm 0x2af6a0000ab0 nRanks 96 e08r3n04:16938:19062 [1] NCCL INFO Channel 01 : 65[26000] -> 66[43000] via P2P/IPC comm 0x2b0ddc000ab0 nRanks 96 e08r3n02:30403:32523 [1] NCCL INFO Channel 01 : 57[26000] -> 58[43000] via P2P/IPC comm 0x2ba378000ab0 nRanks 96 e08r2n09:27005:29650 [2] NCCL INFO Channel 01 : 6[43000] -> 7[63000] via P2P/IPC comm 0x2b40ac000ab0 nRanks 96 e08r3n11:29648:32286 [2] NCCL INFO Channel 01 : 94[43000] -> 95[63000] via P2P/IPC comm 0x2b900c000ab0 nRanks 96 e08r3n09:8678:11333 [2] NCCL INFO Channel 00 : 86[43000] -> 87[63000] via P2P/IPC comm 0x2b235c000ab0 nRanks 96 e08r3n10:18787:21519 [2] NCCL INFO Channel 00 : 90[43000] -> 91[63000] via P2P/IPC comm 0x2ae928000ab0 nRanks 96 e08r3n08:13436:16169 [1] NCCL INFO Channel 00 : 81[26000] -> 82[43000] via P2P/IPC comm 0x2b1bb8000ab0 nRanks 96 e08r3n04:16939:19064 [2] NCCL INFO Channel 01 : 66[43000] -> 67[63000] via P2P/IPC comm 0x2b5118000ab0 nRanks 96 e08r2n09:27004:29648 [1] NCCL INFO Channel 01 : 5[26000] -> 6[43000] via P2P/IPC comm 0x2af944000ab0 nRanks 96 e08r3n11:29647:32289 [1] NCCL INFO Channel 01 : 93[26000] -> 94[43000] via P2P/IPC comm 0x2abf74000ab0 nRanks 96 e08r3n09:8677:11336 [1] NCCL INFO Channel 01 : 85[26000] -> 86[43000] via P2P/IPC comm 0x2b45a8000ab0 nRanks 96 e08r3n10:18786:21523 [1] NCCL INFO Channel 01 : 89[26000] -> 90[43000] via P2P/IPC comm 0x2ac5c0000ab0 nRanks 96 e08r3n08:13437:16171 [2] NCCL INFO Channel 01 : 82[43000] -> 83[63000] via P2P/IPC comm 0x2b919c000ab0 nRanks 96 e08r3n09:8678:11333 [2] NCCL INFO Channel 01 : 86[43000] -> 87[63000] via P2P/IPC comm 0x2b235c000ab0 nRanks 96 e08r3n10:18787:21519 [2] NCCL INFO Channel 01 : 90[43000] -> 91[63000] via P2P/IPC comm 0x2ae928000ab0 nRanks 96 e08r3n08:13436:16169 [1] NCCL INFO Channel 01 : 81[26000] -> 82[43000] via P2P/IPC comm 0x2b1bb8000ab0 nRanks 96 e08r2n18:755:3474 [3] NCCL INFO Channel 00/0 : 43[63000] -> 44[4000] [send] via NET/IB/0 comm 0x2b8210000ab0 nRanks 96 e08r2n15:22025:24655 [3] NCCL INFO Channel 00/0 : 31[63000] -> 32[4000] [send] via NET/IB/0 comm 0x2b3468000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 01/0 : 27[63000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5f80000ab0 nRanks 96 e08r2n18:751:3479 [0] NCCL INFO Channel 01/0 : 39[63000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8398000ab0 nRanks 96 e08r2n18:751:3479 [0] NCCL INFO Channel 00 : 40[4000] -> 41[26000] via P2P/IPC comm 0x2b8398000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 00 : 28[4000] -> 29[26000] via P2P/IPC comm 0x2b5f80000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 01 : 28[4000] -> 29[26000] via P2P/IPC comm 0x2b5f80000ab0 nRanks 96 e08r2n18:751:3479 [0] NCCL INFO Channel 01 : 40[4000] -> 41[26000] via P2P/IPC comm 0x2b8398000ab0 nRanks 96 e08r2n11:5734:8345 [3] NCCL INFO Channel 00/0 : 15[63000] -> 16[4000] [send] via NET/IB/0 comm 0x2b4320000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 01/0 : 51[63000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b899c000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 00 : 52[4000] -> 53[26000] via P2P/IPC comm 0x2b899c000ab0 nRanks 96 e08r2n14:18196:20819 [3] NCCL INFO Channel 00/0 : 27[63000] -> 28[4000] [send] via NET/IB/0 comm 0x2ab848000ab0 nRanks 96 e08r2n16:13446:16166 [3] NCCL INFO Channel 00/0 : 35[63000] -> 36[4000] [send] via NET/IB/0 comm 0x2ac21c000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 01/0 : 23[63000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b8b18000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 00 : 24[4000] -> 25[26000] via P2P/IPC comm 0x2b8b18000ab0 nRanks 96 e08r2n17:21284:23952 [3] NCCL INFO Channel 00/0 : 39[63000] -> 40[4000] [send] via NET/IB/0 comm 0x2ba784000ab0 nRanks 96 e08r2n17:21280:23959 [0] NCCL INFO Channel 01/0 : 35[63000] -> 36[4000] [receive] via NET/IB/0 comm 0x2b01f0000ab0 nRanks 96 e08r2n16:13442:16162 [0] NCCL INFO Channel 01/0 : 31[63000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4c88000ab0 nRanks 96 e08r2n17:21280:23959 [0] NCCL INFO Channel 00 : 36[4000] -> 37[26000] via P2P/IPC comm 0x2b01f0000ab0 nRanks 96 e08r2n16:13442:16162 [0] NCCL INFO Channel 00 : 32[4000] -> 33[26000] via P2P/IPC comm 0x2b4c88000ab0 nRanks 96 e08r2n19:9034:11808 [3] NCCL INFO Channel 00/0 : 47[63000] -> 48[4000] [send] via NET/IB/0 comm 0x2b6ba4000ab0 nRanks 96 e08r3n00:14536:16697 [3] NCCL INFO Channel 00/0 : 51[63000] -> 52[4000] [send] via NET/IB/0 comm 0x2b79d4000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 01/0 : 43[63000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 00 : 44[4000] -> 45[26000] via P2P/IPC comm 0x2ab5e8000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Channel 01/0 : 47[63000] -> 48[4000] [receive] via NET/IB/0 comm 0x2ac0ac000ab0 nRanks 96 e08r2n13:23995:26735 [3] NCCL INFO Channel 00/0 : 23[63000] -> 24[4000] [send] via NET/IB/0 comm 0x2b4d6c000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Channel 00 : 48[4000] -> 49[26000] via P2P/IPC comm 0x2ac0ac000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 01/0 : 19[63000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b51f4000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Channel 01/0 : 7[63000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b62a4000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Channel 00 : 8[4000] -> 9[26000] via P2P/IPC comm 0x2b62a4000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 00 : 20[4000] -> 21[26000] via P2P/IPC comm 0x2b51f4000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 01 : 52[4000] -> 53[26000] via P2P/IPC comm 0x2b899c000ab0 nRanks 96 e08r2n12:8675:11360 [3] NCCL INFO Channel 00/0 : 19[63000] -> 20[4000] [send] via NET/IB/0 comm 0x2b3078000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 01/0 : 15[63000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b6958000ab0 nRanks 96 e08r2n16:13442:16162 [0] NCCL INFO Channel 01 : 32[4000] -> 33[26000] via P2P/IPC comm 0x2b4c88000ab0 nRanks 96 e08r3n07:4893:7208 [3] NCCL INFO Channel 00/0 : 79[63000] -> 80[4000] [send] via NET/IB/0 comm 0x2ba900000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 00 : 16[4000] -> 17[26000] via P2P/IPC comm 0x2b6958000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 01 : 44[4000] -> 45[26000] via P2P/IPC comm 0x2ab5e8000ab0 nRanks 96 e08r2n17:21280:23959 [0] NCCL INFO Channel 01 : 36[4000] -> 37[26000] via P2P/IPC comm 0x2b01f0000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Channel 01/0 : 75[63000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aefdc000ab0 nRanks 96 e08r3n04:16940:19060 [3] NCCL INFO Channel 00/0 : 67[63000] -> 68[4000] [send] via NET/IB/0 comm 0x2b208c000ab0 nRanks 96 e08r3n02:30405:32517 [3] NCCL INFO Channel 00/0 : 59[63000] -> 60[4000] [send] via NET/IB/0 comm 0x2b6b88000ab0 nRanks 96 e08r3n11:29649:32285 [3] NCCL INFO Channel 00/0 : 95[63000] -> 0[4000] [send] via NET/IB/0 comm 0x2ba94c000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Channel 00 : 76[4000] -> 77[26000] via P2P/IPC comm 0x2aefdc000ab0 nRanks 96 e08r3n04:16936:19068 [0] NCCL INFO Channel 01/0 : 63[63000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b37d8000ab0 nRanks 96 e08r3n02:30401:32525 [0] NCCL INFO Channel 01/0 : 55[63000] -> 56[4000] [receive] via NET/IB/0 comm 0x2badc0000ab0 nRanks 96 e08r3n11:29645:32290 [0] NCCL INFO Channel 01/0 : 91[63000] -> 92[4000] [receive] via NET/IB/0 comm 0x2ac49c000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 01 : 24[4000] -> 25[26000] via P2P/IPC comm 0x2b8b18000ab0 nRanks 96 e08r3n05:24735:27390 [3] NCCL INFO Channel 00/0 : 71[63000] -> 72[4000] [send] via NET/IB/0 comm 0x2ac47c000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Channel 01 : 8[4000] -> 9[26000] via P2P/IPC comm 0x2b62a4000ab0 nRanks 96 e08r2n08:5142:8204 [3] NCCL INFO Channel 00/0 : 3[63000] -> 4[4000] [send] via NET/IB/0 comm 0x2ad70c000ab0 nRanks 96 e08r2n08:5136:8202 [0] NCCL INFO Channel 01/0 : 95[63000] -> 0[4000] [receive] via NET/IB/0 comm 0x2b30a8000ab0 nRanks 96 e08r2n08:5136:8202 [0] NCCL INFO Channel 00 : 0[4000] -> 1[26000] via P2P/IPC comm 0x2b30a8000ab0 nRanks 96 e08r3n04:16936:19068 [0] NCCL INFO Channel 00 : 64[4000] -> 65[26000] via P2P/IPC comm 0x2b37d8000ab0 nRanks 96 e08r3n02:30401:32525 [0] NCCL INFO Channel 00 : 56[4000] -> 57[26000] via P2P/IPC comm 0x2badc0000ab0 nRanks 96 e08r3n11:29645:32290 [0] NCCL INFO Channel 00 : 92[4000] -> 93[26000] via P2P/IPC comm 0x2ac49c000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 01/0 : 67[63000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b883c000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 00 : 68[4000] -> 69[26000] via P2P/IPC comm 0x2b883c000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Channel 01 : 48[4000] -> 49[26000] via P2P/IPC comm 0x2ac0ac000ab0 nRanks 96 e08r3n09:8679:11332 [3] NCCL INFO Channel 00/0 : 87[63000] -> 88[4000] [send] via NET/IB/0 comm 0x2b0eac000ab0 nRanks 96 e08r3n06:22285:25007 [3] NCCL INFO Channel 00/0 : 75[63000] -> 76[4000] [send] via NET/IB/0 comm 0x2b9418000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 01 : 20[4000] -> 21[26000] via P2P/IPC comm 0x2b51f4000ab0 nRanks 96 e08r3n04:16936:19068 [0] NCCL INFO Channel 01 : 64[4000] -> 65[26000] via P2P/IPC comm 0x2b37d8000ab0 nRanks 96 e08r3n02:30401:32525 [0] NCCL INFO Channel 01 : 56[4000] -> 57[26000] via P2P/IPC comm 0x2badc0000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 01 : 68[4000] -> 69[26000] via P2P/IPC comm 0x2b883c000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 01/0 : 83[63000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b43d0000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 00 : 84[4000] -> 85[26000] via P2P/IPC comm 0x2b43d0000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 01/0 : 71[63000] -> 72[4000] [receive] via NET/IB/0 comm 0x2afc48000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 00 : 72[4000] -> 73[26000] via P2P/IPC comm 0x2afc48000ab0 nRanks 96 e08r2n11:5730:8342 [0] NCCL INFO Channel 01/0 : 11[63000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7cc4000ab0 nRanks 96 e08r3n01:6279:8492 [3] NCCL INFO Channel 00/0 : 55[63000] -> 56[4000] [send] via NET/IB/0 comm 0x2aecbc000ab0 nRanks 96 e08r3n03:22739:25421 [3] NCCL INFO Channel 00/0 : 63[63000] -> 64[4000] [send] via NET/IB/0 comm 0x2b0784000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Channel 01 : 76[4000] -> 77[26000] via P2P/IPC comm 0x2aefdc000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 01 : 16[4000] -> 17[26000] via P2P/IPC comm 0x2b6958000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 01/0 : 79[63000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abf58000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 00 : 80[4000] -> 81[26000] via P2P/IPC comm 0x2abf58000ab0 nRanks 96 e08r2n08:5136:8202 [0] NCCL INFO Channel 01 : 0[4000] -> 1[26000] via P2P/IPC comm 0x2b30a8000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 01 : 84[4000] -> 85[26000] via P2P/IPC comm 0x2b43d0000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 01 : 72[4000] -> 73[26000] via P2P/IPC comm 0x2afc48000ab0 nRanks 96 e08r2n11:5730:8342 [0] NCCL INFO Channel 00 : 12[4000] -> 13[26000] via P2P/IPC comm 0x2b7cc4000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 01/0 : 59[63000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4768000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 00 : 60[4000] -> 61[26000] via P2P/IPC comm 0x2b4768000ab0 nRanks 96 e08r3n10:18788:21518 [3] NCCL INFO Channel 00/0 : 91[63000] -> 92[4000] [send] via NET/IB/0 comm 0x2adaac000ab0 nRanks 96 e08r2n10:876:3570 [3] NCCL INFO Channel 00/0 : 11[63000] -> 12[4000] [send] via NET/IB/0 comm 0x2b2f70000ab0 nRanks 96 e08r3n11:29645:32290 [0] NCCL INFO Channel 01 : 92[4000] -> 93[26000] via P2P/IPC comm 0x2ac49c000ab0 nRanks 96 e08r2n11:5730:8342 [0] NCCL INFO Channel 01 : 12[4000] -> 13[26000] via P2P/IPC comm 0x2b7cc4000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 01 : 60[4000] -> 61[26000] via P2P/IPC comm 0x2b4768000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 01/0 : 87[63000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af26c000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 00 : 88[4000] -> 89[26000] via P2P/IPC comm 0x2af26c000ab0 nRanks 96 e08r2n09:27006:29649 [3] NCCL INFO Channel 00/0 : 7[63000] -> 8[4000] [send] via NET/IB/0 comm 0x2b5948000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 01 : 80[4000] -> 81[26000] via P2P/IPC comm 0x2abf58000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 01 : 88[4000] -> 89[26000] via P2P/IPC comm 0x2af26c000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 01/0 : 3[63000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0f80000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 00 : 4[4000] -> 5[26000] via P2P/IPC comm 0x2b0f80000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 01 : 4[4000] -> 5[26000] via P2P/IPC comm 0x2b0f80000ab0 nRanks 96 e08r3n08:13438:16173 [3] NCCL INFO Channel 00/0 : 83[63000] -> 84[4000] [send] via NET/IB/0 comm 0x2b2878000ab0 nRanks 96 e08r2n18:753:3473 [1] NCCL INFO Connected all rings comm 0x2b3358000ab0 nRanks 96 busId 26000 e08r2n15:22023:24652 [1] NCCL INFO Connected all rings comm 0x2ad720000ab0 nRanks 96 busId 26000 e08r2n15:22023:24652 [1] NCCL INFO Channel 01/0 : 29[26000] -> 60[4000] [send] via NET/IB/0 comm 0x2ad720000ab0 nRanks 96 e08r2n18:753:3473 [1] NCCL INFO Channel 00/0 : 36[4000] -> 41[26000] [receive] via NET/IB/0 comm 0x2b3358000ab0 nRanks 96 e08r2n19:9032:11812 [1] NCCL INFO Connected all rings comm 0x2af85c000ab0 nRanks 96 busId 26000 e08r2n16:13444:16165 [1] NCCL INFO Connected all rings comm 0x2b03e8000ab0 nRanks 96 busId 26000 e08r2n14:18194:20823 [1] NCCL INFO Connected all rings comm 0x2b4618000ab0 nRanks 96 busId 26000 e08r3n00:14534:16703 [1] NCCL INFO Connected all rings comm 0x2b8e34000ab0 nRanks 96 busId 26000 e08r3n01:6277:8491 [1] NCCL INFO Connected all rings comm 0x2ba5b0000ab0 nRanks 96 busId 26000 e08r2n10:874:3574 [1] NCCL INFO Connected all rings comm 0x2b20f0000ab0 nRanks 96 busId 26000 e08r2n13:23993:26732 [1] NCCL INFO Connected all rings comm 0x2b42c0000ab0 nRanks 96 busId 26000 e08r2n19:9032:11812 [1] NCCL INFO Channel 01/0 : 45[26000] -> 52[4000] [send] via NET/IB/0 comm 0x2af85c000ab0 nRanks 96 e08r2n17:21282:23955 [1] NCCL INFO Connected all rings comm 0x2ac164000ab0 nRanks 96 busId 26000 e08r2n12:8673:11362 [1] NCCL INFO Connected all rings comm 0x2b951c000ab0 nRanks 96 busId 26000 e08r3n04:16938:19062 [1] NCCL INFO Connected all rings comm 0x2b0ddc000ab0 nRanks 96 busId 26000 e08r3n02:30403:32523 [1] NCCL INFO Connected all rings comm 0x2ba378000ab0 nRanks 96 busId 26000 e08r3n05:24733:27396 [1] NCCL INFO Connected all rings comm 0x2abc38000ab0 nRanks 96 busId 26000 e08r2n16:13444:16165 [1] NCCL INFO Channel 00/0 : 16[4000] -> 33[26000] [receive] via NET/IB/0 comm 0x2b03e8000ab0 nRanks 96 e08r2n14:18194:20823 [1] NCCL INFO Channel 00/0 : 20[4000] -> 25[26000] [receive] via NET/IB/0 comm 0x2b4618000ab0 nRanks 96 e08r3n01:6277:8491 [1] NCCL INFO Channel 01/0 : 53[26000] -> 56[4000] [send] via NET/IB/0 comm 0x2ba5b0000ab0 nRanks 96 e08r3n11:29647:32289 [1] NCCL INFO Connected all rings comm 0x2abf74000ab0 nRanks 96 busId 26000 e08r3n00:14534:16703 [1] NCCL INFO Channel 00/0 : 40[4000] -> 49[26000] [receive] via NET/IB/0 comm 0x2b8e34000ab0 nRanks 96 e08r2n13:23993:26732 [1] NCCL INFO Channel 01/0 : 21[26000] -> 24[4000] [send] via NET/IB/0 comm 0x2b42c0000ab0 nRanks 96 e08r2n08:5140:8208 [1] NCCL INFO Connected all rings comm 0x2b3330000ab0 nRanks 96 busId 26000 e08r2n10:874:3574 [1] NCCL INFO Channel 00/0 : 4[4000] -> 9[26000] [receive] via NET/IB/0 comm 0x2b20f0000ab0 nRanks 96 e08r3n08:13436:16169 [1] NCCL INFO Connected all rings comm 0x2b1bb8000ab0 nRanks 96 busId 26000 e08r2n11:5732:8346 [1] NCCL INFO Connected all rings comm 0x2b1404000ab0 nRanks 96 busId 26000 e08r3n03:22737:25417 [1] NCCL INFO Connected all rings comm 0x2ac904000ab0 nRanks 96 busId 26000 e08r2n17:21282:23955 [1] NCCL INFO Channel 01/0 : 37[26000] -> 40[4000] [send] via NET/IB/0 comm 0x2ac164000ab0 nRanks 96 e08r3n05:24733:27396 [1] NCCL INFO Channel 01/0 : 69[26000] -> 72[4000] [send] via NET/IB/0 comm 0x2abc38000ab0 nRanks 96 e08r3n04:16938:19062 [1] NCCL INFO Channel 00/0 : 32[4000] -> 65[26000] [receive] via NET/IB/0 comm 0x2b0ddc000ab0 nRanks 96 e08r2n12:8673:11362 [1] NCCL INFO Channel 00/0 : 8[4000] -> 17[26000] [receive] via NET/IB/0 comm 0x2b951c000ab0 nRanks 96 e08r3n07:4891:7204 [1] NCCL INFO Connected all rings comm 0x2b7cf8000ab0 nRanks 96 busId 26000 e08r3n02:30403:32523 [1] NCCL INFO Channel 00/0 : 52[4000] -> 57[26000] [receive] via NET/IB/0 comm 0x2ba378000ab0 nRanks 96 e08r3n09:8677:11336 [1] NCCL INFO Connected all rings comm 0x2b45a8000ab0 nRanks 96 busId 26000 e08r2n09:27004:29648 [1] NCCL INFO Connected all rings comm 0x2af944000ab0 nRanks 96 busId 26000 e08r3n06:22283:25009 [1] NCCL INFO Connected all rings comm 0x2b9cec000ab0 nRanks 96 busId 26000 e08r3n03:22737:25417 [1] NCCL INFO Channel 01/0 : 61[26000] -> 76[4000] [send] via NET/IB/0 comm 0x2ac904000ab0 nRanks 96 e08r2n11:5732:8346 [1] NCCL INFO Channel 01/0 : 13[26000] -> 20[4000] [send] via NET/IB/0 comm 0x2b1404000ab0 nRanks 96 e08r3n10:18786:21523 [1] NCCL INFO Connected all rings comm 0x2ac5c0000ab0 nRanks 96 busId 26000 e08r2n08:5140:8208 [1] NCCL INFO Channel 00 : 1[26000] -> 0[4000] via P2P/IPC comm 0x2b3330000ab0 nRanks 96 e08r3n07:4891:7204 [1] NCCL INFO Channel 01/0 : 77[26000] -> 84[4000] [send] via NET/IB/0 comm 0x2b7cf8000ab0 nRanks 96 e08r3n11:29647:32289 [1] NCCL INFO Channel 00 : 93[26000] -> 92[4000] via P2P/IPC comm 0x2abf74000ab0 nRanks 96 e08r3n08:13436:16169 [1] NCCL INFO Channel 00/0 : 72[4000] -> 81[26000] [receive] via NET/IB/0 comm 0x2b1bb8000ab0 nRanks 96 e08r2n09:27004:29648 [1] NCCL INFO Channel 01/0 : 5[26000] -> 8[4000] [send] via NET/IB/0 comm 0x2af944000ab0 nRanks 96 e08r3n09:8677:11336 [1] NCCL INFO Channel 01/0 : 85[26000] -> 88[4000] [send] via NET/IB/0 comm 0x2b45a8000ab0 nRanks 96 e08r2n08:5140:8208 [1] NCCL INFO Channel 01 : 1[26000] -> 0[4000] via P2P/IPC comm 0x2b3330000ab0 nRanks 96 e08r3n11:29647:32289 [1] NCCL INFO Channel 01 : 93[26000] -> 92[4000] via P2P/IPC comm 0x2abf74000ab0 nRanks 96 e08r3n06:22283:25009 [1] NCCL INFO Channel 00/0 : 68[4000] -> 73[26000] [receive] via NET/IB/0 comm 0x2b9cec000ab0 nRanks 96 e08r3n10:18786:21523 [1] NCCL INFO Channel 00/0 : 84[4000] -> 89[26000] [receive] via NET/IB/0 comm 0x2ac5c0000ab0 nRanks 96 e08r2n18:755:3474 [3] NCCL INFO Channel 01/0 : 43[63000] -> 44[4000] [send] via NET/IB/0 comm 0x2b8210000ab0 nRanks 96 e08r2n15:22025:24655 [3] NCCL INFO Channel 01/0 : 31[63000] -> 32[4000] [send] via NET/IB/0 comm 0x2b3468000ab0 nRanks 96 e08r2n11:5734:8345 [3] NCCL INFO Channel 01/0 : 15[63000] -> 16[4000] [send] via NET/IB/0 comm 0x2b4320000ab0 nRanks 96 e08r2n14:18196:20819 [3] NCCL INFO Channel 01/0 : 27[63000] -> 28[4000] [send] via NET/IB/0 comm 0x2ab848000ab0 nRanks 96 e08r2n16:13446:16166 [3] NCCL INFO Channel 01/0 : 35[63000] -> 36[4000] [send] via NET/IB/0 comm 0x2ac21c000ab0 nRanks 96 e08r2n17:21284:23952 [3] NCCL INFO Channel 01/0 : 39[63000] -> 40[4000] [send] via NET/IB/0 comm 0x2ba784000ab0 nRanks 96 e08r3n00:14536:16697 [3] NCCL INFO Channel 01/0 : 51[63000] -> 52[4000] [send] via NET/IB/0 comm 0x2b79d4000ab0 nRanks 96 e08r2n19:9034:11808 [3] NCCL INFO Channel 01/0 : 47[63000] -> 48[4000] [send] via NET/IB/0 comm 0x2b6ba4000ab0 nRanks 96 e08r2n13:23995:26735 [3] NCCL INFO Channel 01/0 : 23[63000] -> 24[4000] [send] via NET/IB/0 comm 0x2b4d6c000ab0 nRanks 96 e08r2n12:8675:11360 [3] NCCL INFO Channel 01/0 : 19[63000] -> 20[4000] [send] via NET/IB/0 comm 0x2b3078000ab0 nRanks 96 e08r3n07:4893:7208 [3] NCCL INFO Channel 01/0 : 79[63000] -> 80[4000] [send] via NET/IB/0 comm 0x2ba900000ab0 nRanks 96 e08r3n02:30405:32517 [3] NCCL INFO Channel 01/0 : 59[63000] -> 60[4000] [send] via NET/IB/0 comm 0x2b6b88000ab0 nRanks 96 e08r3n04:16940:19060 [3] NCCL INFO Channel 01/0 : 67[63000] -> 68[4000] [send] via NET/IB/0 comm 0x2b208c000ab0 nRanks 96 e08r3n05:24735:27390 [3] NCCL INFO Channel 01/0 : 71[63000] -> 72[4000] [send] via NET/IB/0 comm 0x2ac47c000ab0 nRanks 96 e08r3n11:29649:32285 [3] NCCL INFO Channel 01/0 : 95[63000] -> 0[4000] [send] via NET/IB/0 comm 0x2ba94c000ab0 nRanks 96 e08r2n08:5142:8204 [3] NCCL INFO Channel 01/0 : 3[63000] -> 4[4000] [send] via NET/IB/0 comm 0x2ad70c000ab0 nRanks 96 e08r3n09:8679:11332 [3] NCCL INFO Channel 01/0 : 87[63000] -> 88[4000] [send] via NET/IB/0 comm 0x2b0eac000ab0 nRanks 96 e08r3n06:22285:25007 [3] NCCL INFO Channel 01/0 : 75[63000] -> 76[4000] [send] via NET/IB/0 comm 0x2b9418000ab0 nRanks 96 e08r3n03:22739:25421 [3] NCCL INFO Channel 01/0 : 63[63000] -> 64[4000] [send] via NET/IB/0 comm 0x2b0784000ab0 nRanks 96 e08r3n01:6279:8492 [3] NCCL INFO Channel 01/0 : 55[63000] -> 56[4000] [send] via NET/IB/0 comm 0x2aecbc000ab0 nRanks 96 e08r3n10:18788:21518 [3] NCCL INFO Channel 01/0 : 91[63000] -> 92[4000] [send] via NET/IB/0 comm 0x2adaac000ab0 nRanks 96 e08r2n10:876:3570 [3] NCCL INFO Channel 01/0 : 11[63000] -> 12[4000] [send] via NET/IB/0 comm 0x2b2f70000ab0 nRanks 96 e08r2n09:27006:29649 [3] NCCL INFO Channel 01/0 : 7[63000] -> 8[4000] [send] via NET/IB/0 comm 0x2b5948000ab0 nRanks 96 e08r2n18:754:3475 [2] NCCL INFO Connected all rings comm 0x2b2c8c000ab0 nRanks 96 busId 43000 e08r2n15:22024:24654 [2] NCCL INFO Connected all rings comm 0x2b14a0000ab0 nRanks 96 busId 43000 e08r2n11:5733:8341 [2] NCCL INFO Connected all rings comm 0x2ae954000ab0 nRanks 96 busId 43000 e08r3n08:13438:16173 [3] NCCL INFO Channel 01/0 : 83[63000] -> 84[4000] [send] via NET/IB/0 comm 0x2b2878000ab0 nRanks 96 e08r2n16:13445:16161 [2] NCCL INFO Connected all rings comm 0x2b6a48000ab0 nRanks 96 busId 43000 e08r2n15:22024:24654 [2] NCCL INFO Channel 00 : 30[43000] -> 29[26000] via P2P/IPC comm 0x2b14a0000ab0 nRanks 96 e08r2n19:9033:11810 [2] NCCL INFO Connected all rings comm 0x2b0610000ab0 nRanks 96 busId 43000 e08r3n00:14535:16698 [2] NCCL INFO Connected all rings comm 0x2bb1cc000ab0 nRanks 96 busId 43000 e08r2n18:754:3475 [2] NCCL INFO Channel 00 : 42[43000] -> 41[26000] via P2P/IPC comm 0x2b2c8c000ab0 nRanks 96 e08r2n17:21283:23951 [2] NCCL INFO Connected all rings comm 0x2b9988000ab0 nRanks 96 busId 43000 e08r2n13:23994:26734 [2] NCCL INFO Connected all rings comm 0x2b5ff4000ab0 nRanks 96 busId 43000 e08r2n12:8674:11365 [2] NCCL INFO Connected all rings comm 0x2b6804000ab0 nRanks 96 busId 43000 e08r2n15:22024:24654 [2] NCCL INFO Channel 01 : 30[43000] -> 29[26000] via P2P/IPC comm 0x2b14a0000ab0 nRanks 96 e08r2n14:18195:20820 [2] NCCL INFO Connected all rings comm 0x2b7728000ab0 nRanks 96 busId 43000 e08r2n18:754:3475 [2] NCCL INFO Channel 01 : 42[43000] -> 41[26000] via P2P/IPC comm 0x2b2c8c000ab0 nRanks 96 e08r3n07:4892:7207 [2] NCCL INFO Connected all rings comm 0x2b98d4000ab0 nRanks 96 busId 43000 e08r2n11:5733:8341 [2] NCCL INFO Channel 00 : 14[43000] -> 13[26000] via P2P/IPC comm 0x2ae954000ab0 nRanks 96 e08r3n02:30404:32518 [2] NCCL INFO Connected all rings comm 0x2b6a10000ab0 nRanks 96 busId 43000 e08r2n16:13445:16161 [2] NCCL INFO Channel 00 : 34[43000] -> 33[26000] via P2P/IPC comm 0x2b6a48000ab0 nRanks 96 e08r2n19:9033:11810 [2] NCCL INFO Channel 00 : 46[43000] -> 45[26000] via P2P/IPC comm 0x2b0610000ab0 nRanks 96 e08r3n04:16939:19064 [2] NCCL INFO Connected all rings comm 0x2b5118000ab0 nRanks 96 busId 43000 e08r3n00:14535:16698 [2] NCCL INFO Channel 00 : 50[43000] -> 49[26000] via P2P/IPC comm 0x2bb1cc000ab0 nRanks 96 e08r3n11:29648:32286 [2] NCCL INFO Connected all rings comm 0x2b900c000ab0 nRanks 96 busId 43000 e08r3n05:24734:27392 [2] NCCL INFO Connected all rings comm 0x2b2914000ab0 nRanks 96 busId 43000 e08r2n13:23994:26734 [2] NCCL INFO Channel 00 : 22[43000] -> 21[26000] via P2P/IPC comm 0x2b5ff4000ab0 nRanks 96 e08r2n11:5733:8341 [2] NCCL INFO Channel 01 : 14[43000] -> 13[26000] via P2P/IPC comm 0x2ae954000ab0 nRanks 96 e08r3n06:22284:25008 [2] NCCL INFO Connected all rings comm 0x2b15fc000ab0 nRanks 96 busId 43000 e08r2n17:21283:23951 [2] NCCL INFO Channel 00 : 38[43000] -> 37[26000] via P2P/IPC comm 0x2b9988000ab0 nRanks 96 e08r2n12:8674:11365 [2] NCCL INFO Channel 00 : 18[43000] -> 17[26000] via P2P/IPC comm 0x2b6804000ab0 nRanks 96 e08r2n16:13445:16161 [2] NCCL INFO Channel 01 : 34[43000] -> 33[26000] via P2P/IPC comm 0x2b6a48000ab0 nRanks 96 e08r2n19:9033:11810 [2] NCCL INFO Channel 01 : 46[43000] -> 45[26000] via P2P/IPC comm 0x2b0610000ab0 nRanks 96 e08r3n09:8678:11333 [2] NCCL INFO Connected all rings comm 0x2b235c000ab0 nRanks 96 busId 43000 e08r2n14:18195:20820 [2] NCCL INFO Channel 00 : 26[43000] -> 25[26000] via P2P/IPC comm 0x2b7728000ab0 nRanks 96 e08r3n10:18787:21519 [2] NCCL INFO Connected all rings comm 0x2ae928000ab0 nRanks 96 busId 43000 e08r3n03:22738:25418 [2] NCCL INFO Connected all rings comm 0x2af6a0000ab0 nRanks 96 busId 43000 e08r3n07:4892:7207 [2] NCCL INFO Channel 00 : 78[43000] -> 77[26000] via P2P/IPC comm 0x2b98d4000ab0 nRanks 96 e08r2n13:23994:26734 [2] NCCL INFO Channel 01 : 22[43000] -> 21[26000] via P2P/IPC comm 0x2b5ff4000ab0 nRanks 96 e08r3n00:14535:16698 [2] NCCL INFO Channel 01 : 50[43000] -> 49[26000] via P2P/IPC comm 0x2bb1cc000ab0 nRanks 96 e08r3n02:30404:32518 [2] NCCL INFO Channel 00 : 58[43000] -> 57[26000] via P2P/IPC comm 0x2b6a10000ab0 nRanks 96 e08r2n17:21283:23951 [2] NCCL INFO Channel 01 : 38[43000] -> 37[26000] via P2P/IPC comm 0x2b9988000ab0 nRanks 96 e08r3n04:16939:19064 [2] NCCL INFO Channel 00 : 66[43000] -> 65[26000] via P2P/IPC comm 0x2b5118000ab0 nRanks 96 e08r3n01:6278:8493 [2] NCCL INFO Connected all rings comm 0x2b1280000ab0 nRanks 96 busId 43000 e08r2n14:18195:20820 [2] NCCL INFO Channel 01 : 26[43000] -> 25[26000] via P2P/IPC comm 0x2b7728000ab0 nRanks 96 e08r2n09:27005:29650 [2] NCCL INFO Connected all rings comm 0x2b40ac000ab0 nRanks 96 busId 43000 e08r2n12:8674:11365 [2] NCCL INFO Channel 01 : 18[43000] -> 17[26000] via P2P/IPC comm 0x2b6804000ab0 nRanks 96 e08r3n07:4892:7207 [2] NCCL INFO Channel 01 : 78[43000] -> 77[26000] via P2P/IPC comm 0x2b98d4000ab0 nRanks 96 e08r2n08:5141:8206 [2] NCCL INFO Connected all rings comm 0x2b5e3c000ab0 nRanks 96 busId 43000 e08r3n02:30404:32518 [2] NCCL INFO Channel 01 : 58[43000] -> 57[26000] via P2P/IPC comm 0x2b6a10000ab0 nRanks 96 e08r3n06:22284:25008 [2] NCCL INFO Channel 00 : 74[43000] -> 73[26000] via P2P/IPC comm 0x2b15fc000ab0 nRanks 96 e08r3n11:29648:32286 [2] NCCL INFO Channel 00 : 94[43000] -> 93[26000] via P2P/IPC comm 0x2b900c000ab0 nRanks 96 e08r3n04:16939:19064 [2] NCCL INFO Channel 01 : 66[43000] -> 65[26000] via P2P/IPC comm 0x2b5118000ab0 nRanks 96 e08r2n10:875:3571 [2] NCCL INFO Connected all rings comm 0x2afb28000ab0 nRanks 96 busId 43000 e08r3n09:8678:11333 [2] NCCL INFO Channel 00 : 86[43000] -> 85[26000] via P2P/IPC comm 0x2b235c000ab0 nRanks 96 e08r3n03:22738:25418 [2] NCCL INFO Channel 00 : 62[43000] -> 61[26000] via P2P/IPC comm 0x2af6a0000ab0 nRanks 96 e08r3n10:18787:21519 [2] NCCL INFO Channel 00 : 90[43000] -> 89[26000] via P2P/IPC comm 0x2ae928000ab0 nRanks 96 e08r3n11:29648:32286 [2] NCCL INFO Channel 01 : 94[43000] -> 93[26000] via P2P/IPC comm 0x2b900c000ab0 nRanks 96 e08r3n06:22284:25008 [2] NCCL INFO Channel 01 : 74[43000] -> 73[26000] via P2P/IPC comm 0x2b15fc000ab0 nRanks 96 e08r3n08:13437:16171 [2] NCCL INFO Connected all rings comm 0x2b919c000ab0 nRanks 96 busId 43000 e08r2n09:27005:29650 [2] NCCL INFO Channel 00 : 6[43000] -> 5[26000] via P2P/IPC comm 0x2b40ac000ab0 nRanks 96 e08r3n09:8678:11333 [2] NCCL INFO Channel 01 : 86[43000] -> 85[26000] via P2P/IPC comm 0x2b235c000ab0 nRanks 96 e08r3n10:18787:21519 [2] NCCL INFO Channel 01 : 90[43000] -> 89[26000] via P2P/IPC comm 0x2ae928000ab0 nRanks 96 e08r3n03:22738:25418 [2] NCCL INFO Channel 01 : 62[43000] -> 61[26000] via P2P/IPC comm 0x2af6a0000ab0 nRanks 96 e08r3n01:6278:8493 [2] NCCL INFO Channel 00 : 54[43000] -> 53[26000] via P2P/IPC comm 0x2b1280000ab0 nRanks 96 e08r2n09:27005:29650 [2] NCCL INFO Channel 01 : 6[43000] -> 5[26000] via P2P/IPC comm 0x2b40ac000ab0 nRanks 96 e08r2n08:5141:8206 [2] NCCL INFO Channel 00 : 2[43000] -> 1[26000] via P2P/IPC comm 0x2b5e3c000ab0 nRanks 96 e08r3n01:6278:8493 [2] NCCL INFO Channel 01 : 54[43000] -> 53[26000] via P2P/IPC comm 0x2b1280000ab0 nRanks 96 e08r2n10:875:3571 [2] NCCL INFO Channel 00 : 10[43000] -> 9[26000] via P2P/IPC comm 0x2afb28000ab0 nRanks 96 e08r3n08:13437:16171 [2] NCCL INFO Channel 00 : 82[43000] -> 81[26000] via P2P/IPC comm 0x2b919c000ab0 nRanks 96 e08r2n08:5141:8206 [2] NCCL INFO Channel 01 : 2[43000] -> 1[26000] via P2P/IPC comm 0x2b5e3c000ab0 nRanks 96 e08r2n10:875:3571 [2] NCCL INFO Channel 01 : 10[43000] -> 9[26000] via P2P/IPC comm 0x2afb28000ab0 nRanks 96 e08r3n08:13437:16171 [2] NCCL INFO Channel 01 : 82[43000] -> 81[26000] via P2P/IPC comm 0x2b919c000ab0 nRanks 96 e08r3n05:24734:27392 [2] NCCL INFO Channel 00 : 70[43000] -> 69[26000] via P2P/IPC comm 0x2b2914000ab0 nRanks 96 e08r3n05:24734:27392 [2] NCCL INFO Channel 01 : 70[43000] -> 69[26000] via P2P/IPC comm 0x2b2914000ab0 nRanks 96 e08r2n18:755:3474 [3] NCCL INFO Connected all rings comm 0x2b8210000ab0 nRanks 96 busId 63000 e08r2n18:755:3474 [3] NCCL INFO Channel 00 : 43[63000] -> 42[43000] via P2P/IPC comm 0x2b8210000ab0 nRanks 96 e08r2n18:755:3474 [3] NCCL INFO Channel 01 : 43[63000] -> 42[43000] via P2P/IPC comm 0x2b8210000ab0 nRanks 96 e08r2n15:22025:24655 [3] NCCL INFO Connected all rings comm 0x2b3468000ab0 nRanks 96 busId 63000 e08r3n00:14536:16697 [3] NCCL INFO Connected all rings comm 0x2b79d4000ab0 nRanks 96 busId 63000 e08r3n00:14536:16697 [3] NCCL INFO Channel 00 : 51[63000] -> 50[43000] via P2P/IPC comm 0x2b79d4000ab0 nRanks 96 e08r2n15:22025:24655 [3] NCCL INFO Channel 00 : 31[63000] -> 30[43000] via P2P/IPC comm 0x2b3468000ab0 nRanks 96 e08r2n15:22025:24655 [3] NCCL INFO Channel 01 : 31[63000] -> 30[43000] via P2P/IPC comm 0x2b3468000ab0 nRanks 96 e08r3n00:14536:16697 [3] NCCL INFO Channel 01 : 51[63000] -> 50[43000] via P2P/IPC comm 0x2b79d4000ab0 nRanks 96 e08r2n14:18196:20819 [3] NCCL INFO Connected all rings comm 0x2ab848000ab0 nRanks 96 busId 63000 e08r2n14:18196:20819 [3] NCCL INFO Channel 00 : 27[63000] -> 26[43000] via P2P/IPC comm 0x2ab848000ab0 nRanks 96 e08r3n11:29649:32285 [3] NCCL INFO Connected all rings comm 0x2ba94c000ab0 nRanks 96 busId 63000 e08r3n11:29649:32285 [3] NCCL INFO Channel 00 : 95[63000] -> 94[43000] via P2P/IPC comm 0x2ba94c000ab0 nRanks 96 e08r2n16:13446:16166 [3] NCCL INFO Connected all rings comm 0x2ac21c000ab0 nRanks 96 busId 63000 e08r2n19:9034:11808 [3] NCCL INFO Connected all rings comm 0x2b6ba4000ab0 nRanks 96 busId 63000 e08r2n16:13446:16166 [3] NCCL INFO Channel 00 : 35[63000] -> 34[43000] via P2P/IPC comm 0x2ac21c000ab0 nRanks 96 e08r2n19:9034:11808 [3] NCCL INFO Channel 00 : 47[63000] -> 46[43000] via P2P/IPC comm 0x2b6ba4000ab0 nRanks 96 e08r3n04:16940:19060 [3] NCCL INFO Connected all rings comm 0x2b208c000ab0 nRanks 96 busId 63000 e08r3n04:16940:19060 [3] NCCL INFO Channel 00 : 67[63000] -> 66[43000] via P2P/IPC comm 0x2b208c000ab0 nRanks 96 e08r3n09:8679:11332 [3] NCCL INFO Connected all rings comm 0x2b0eac000ab0 nRanks 96 busId 63000 e08r3n11:29649:32285 [3] NCCL INFO Channel 01 : 95[63000] -> 94[43000] via P2P/IPC comm 0x2ba94c000ab0 nRanks 96 e08r3n09:8679:11332 [3] NCCL INFO Channel 00 : 87[63000] -> 86[43000] via P2P/IPC comm 0x2b0eac000ab0 nRanks 96 e08r2n19:9034:11808 [3] NCCL INFO Channel 01 : 47[63000] -> 46[43000] via P2P/IPC comm 0x2b6ba4000ab0 nRanks 96 e08r2n14:18196:20819 [3] NCCL INFO Channel 01 : 27[63000] -> 26[43000] via P2P/IPC comm 0x2ab848000ab0 nRanks 96 e08r2n16:13446:16166 [3] NCCL INFO Channel 01 : 35[63000] -> 34[43000] via P2P/IPC comm 0x2ac21c000ab0 nRanks 96 e08r3n06:22285:25007 [3] NCCL INFO Connected all rings comm 0x2b9418000ab0 nRanks 96 busId 63000 e08r3n04:16940:19060 [3] NCCL INFO Channel 01 : 67[63000] -> 66[43000] via P2P/IPC comm 0x2b208c000ab0 nRanks 96 e08r3n06:22285:25007 [3] NCCL INFO Channel 00 : 75[63000] -> 74[43000] via P2P/IPC comm 0x2b9418000ab0 nRanks 96 e08r3n09:8679:11332 [3] NCCL INFO Channel 01 : 87[63000] -> 86[43000] via P2P/IPC comm 0x2b0eac000ab0 nRanks 96 e08r3n02:30405:32517 [3] NCCL INFO Connected all rings comm 0x2b6b88000ab0 nRanks 96 busId 63000 e08r3n03:22739:25421 [3] NCCL INFO Connected all rings comm 0x2b0784000ab0 nRanks 96 busId 63000 e08r3n03:22739:25421 [3] NCCL INFO Channel 00 : 63[63000] -> 62[43000] via P2P/IPC comm 0x2b0784000ab0 nRanks 96 e08r3n02:30405:32517 [3] NCCL INFO Channel 00 : 59[63000] -> 58[43000] via P2P/IPC comm 0x2b6b88000ab0 nRanks 96 e08r3n06:22285:25007 [3] NCCL INFO Channel 01 : 75[63000] -> 74[43000] via P2P/IPC comm 0x2b9418000ab0 nRanks 96 e08r3n07:4893:7208 [3] NCCL INFO Connected all rings comm 0x2ba900000ab0 nRanks 96 busId 63000 e08r3n07:4893:7208 [3] NCCL INFO Channel 00 : 79[63000] -> 78[43000] via P2P/IPC comm 0x2ba900000ab0 nRanks 96 e08r3n03:22739:25421 [3] NCCL INFO Channel 01 : 63[63000] -> 62[43000] via P2P/IPC comm 0x2b0784000ab0 nRanks 96 e08r2n11:5734:8345 [3] NCCL INFO Connected all rings comm 0x2b4320000ab0 nRanks 96 busId 63000 e08r3n02:30405:32517 [3] NCCL INFO Channel 01 : 59[63000] -> 58[43000] via P2P/IPC comm 0x2b6b88000ab0 nRanks 96 e08r2n11:5734:8345 [3] NCCL INFO Channel 00 : 15[63000] -> 14[43000] via P2P/IPC comm 0x2b4320000ab0 nRanks 96 e08r3n05:24735:27390 [3] NCCL INFO Connected all rings comm 0x2ac47c000ab0 nRanks 96 busId 63000 e08r3n05:24735:27390 [3] NCCL INFO Channel 00 : 71[63000] -> 70[43000] via P2P/IPC comm 0x2ac47c000ab0 nRanks 96 e08r3n07:4893:7208 [3] NCCL INFO Channel 01 : 79[63000] -> 78[43000] via P2P/IPC comm 0x2ba900000ab0 nRanks 96 e08r2n18:755:3474 [3] NCCL INFO Connected all trees comm 0x2b8210000ab0 nRanks 96 busId 63000 e08r2n18:755:3474 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n18:755:3474 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5734:8345 [3] NCCL INFO Channel 01 : 15[63000] -> 14[43000] via P2P/IPC comm 0x2b4320000ab0 nRanks 96 e08r3n05:24735:27390 [3] NCCL INFO Channel 01 : 71[63000] -> 70[43000] via P2P/IPC comm 0x2ac47c000ab0 nRanks 96 e08r2n08:5142:8204 [3] NCCL INFO Connected all rings comm 0x2ad70c000ab0 nRanks 96 busId 63000 e08r3n01:6279:8492 [3] NCCL INFO Connected all rings comm 0x2aecbc000ab0 nRanks 96 busId 63000 e08r2n08:5142:8204 [3] NCCL INFO Channel 00 : 3[63000] -> 2[43000] via P2P/IPC comm 0x2ad70c000ab0 nRanks 96 e08r3n01:6279:8492 [3] NCCL INFO Channel 00 : 55[63000] -> 54[43000] via P2P/IPC comm 0x2aecbc000ab0 nRanks 96 e08r2n16:13442:16162 [0] NCCL INFO Connected all rings comm 0x2b4c88000ab0 nRanks 96 busId 4000 e08r2n19:9030:11813 [0] NCCL INFO Connected all rings comm 0x2ab5e8000ab0 nRanks 96 busId 4000 e08r3n00:14536:16697 [3] NCCL INFO Connected all trees comm 0x2b79d4000ab0 nRanks 96 busId 63000 e08r3n08:13438:16173 [3] NCCL INFO Connected all rings comm 0x2b2878000ab0 nRanks 96 busId 63000 e08r2n15:22025:24655 [3] NCCL INFO Connected all trees comm 0x2b3468000ab0 nRanks 96 busId 63000 e08r3n08:13438:16173 [3] NCCL INFO Channel 00 : 83[63000] -> 82[43000] via P2P/IPC comm 0x2b2878000ab0 nRanks 96 e08r2n15:22025:24655 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n15:22025:24655 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14536:16697 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5142:8204 [3] NCCL INFO Channel 01 : 3[63000] -> 2[43000] via P2P/IPC comm 0x2ad70c000ab0 nRanks 96 e08r3n00:14536:16697 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n01:6279:8492 [3] NCCL INFO Channel 01 : 55[63000] -> 54[43000] via P2P/IPC comm 0x2aecbc000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Connected all rings comm 0x2ac0ac000ab0 nRanks 96 busId 4000 e08r3n08:13438:16173 [3] NCCL INFO Channel 01 : 83[63000] -> 82[43000] via P2P/IPC comm 0x2b2878000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Connected all rings comm 0x2b5f80000ab0 nRanks 96 busId 4000 e08r3n10:18788:21518 [3] NCCL INFO Connected all rings comm 0x2adaac000ab0 nRanks 96 busId 63000 e08r3n10:18788:21518 [3] NCCL INFO Channel 00 : 91[63000] -> 90[43000] via P2P/IPC comm 0x2adaac000ab0 nRanks 96 e08r3n11:29649:32285 [3] NCCL INFO Connected all trees comm 0x2ba94c000ab0 nRanks 96 busId 63000 e08r3n11:29649:32285 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5136:8202 [0] NCCL INFO Connected all rings comm 0x2b30a8000ab0 nRanks 96 busId 4000 e08r3n11:29649:32285 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n14:18196:20819 [3] NCCL INFO Connected all trees comm 0x2ab848000ab0 nRanks 96 busId 63000 e08r2n10:876:3570 [3] NCCL INFO Connected all rings comm 0x2b2f70000ab0 nRanks 96 busId 63000 e08r3n10:18788:21518 [3] NCCL INFO Channel 01 : 91[63000] -> 90[43000] via P2P/IPC comm 0x2adaac000ab0 nRanks 96 e08r2n14:18196:20819 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n14:18196:20819 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n10:876:3570 [3] NCCL INFO Channel 00 : 11[63000] -> 10[43000] via P2P/IPC comm 0x2b2f70000ab0 nRanks 96 e08r2n16:13446:16166 [3] NCCL INFO Connected all trees comm 0x2ac21c000ab0 nRanks 96 busId 63000 e08r3n01:6275:8490 [0] NCCL INFO Connected all rings comm 0x2b899c000ab0 nRanks 96 busId 4000 e08r3n09:8679:11332 [3] NCCL INFO Connected all trees comm 0x2b0eac000ab0 nRanks 96 busId 63000 e08r3n11:29648:32286 [2] NCCL INFO Connected all trees comm 0x2b900c000ab0 nRanks 96 busId 43000 e08r2n16:13446:16166 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n09:8679:11332 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n11:29648:32286 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n04:16940:19060 [3] NCCL INFO Connected all trees comm 0x2b208c000ab0 nRanks 96 busId 63000 e08r2n16:13446:16166 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8679:11332 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n11:29648:32286 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n04:16940:19060 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n04:16940:19060 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n19:9034:11808 [3] NCCL INFO Connected all trees comm 0x2b6ba4000ab0 nRanks 96 busId 63000 e08r2n19:9034:11808 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n10:876:3570 [3] NCCL INFO Channel 01 : 11[63000] -> 10[43000] via P2P/IPC comm 0x2b2f70000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Connected all rings comm 0x2b4768000ab0 nRanks 96 busId 4000 e08r2n19:9034:11808 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n03:22739:25421 [3] NCCL INFO Connected all trees comm 0x2b0784000ab0 nRanks 96 busId 63000 e08r3n03:22739:25421 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22285:25007 [3] NCCL INFO Connected all trees comm 0x2b9418000ab0 nRanks 96 busId 63000 e08r3n03:22739:25421 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n06:22285:25007 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22285:25007 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n07:4889:7203 [0] NCCL INFO Connected all rings comm 0x2aefdc000ab0 nRanks 96 busId 4000 e08r3n02:30405:32517 [3] NCCL INFO Connected all trees comm 0x2b6b88000ab0 nRanks 96 busId 63000 e08r3n07:4893:7208 [3] NCCL INFO Connected all trees comm 0x2ba900000ab0 nRanks 96 busId 63000 e08r3n05:24731:27398 [0] NCCL INFO Connected all rings comm 0x2b883c000ab0 nRanks 96 busId 4000 e08r3n02:30405:32517 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n07:4893:7208 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n02:30405:32517 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n07:4893:7208 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21280:23959 [0] NCCL INFO Connected all rings comm 0x2b01f0000ab0 nRanks 96 busId 4000 e08r3n05:24735:27390 [3] NCCL INFO Connected all trees comm 0x2ac47c000ab0 nRanks 96 busId 63000 e08r3n02:30401:32525 [0] NCCL INFO Connected all rings comm 0x2badc0000ab0 nRanks 96 busId 4000 e08r2n11:5734:8345 [3] NCCL INFO Connected all trees comm 0x2b4320000ab0 nRanks 96 busId 63000 e08r3n05:24735:27390 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n05:24735:27390 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n04:16936:19068 [0] NCCL INFO Connected all rings comm 0x2b37d8000ab0 nRanks 96 busId 4000 e08r3n06:22281:25013 [0] NCCL INFO Connected all rings comm 0x2afc48000ab0 nRanks 96 busId 4000 e08r2n11:5734:8345 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5734:8345 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n10:18784:21522 [0] NCCL INFO Connected all rings comm 0x2af26c000ab0 nRanks 96 busId 4000 e08r2n08:5142:8204 [3] NCCL INFO Connected all trees comm 0x2ad70c000ab0 nRanks 96 busId 63000 e08r2n08:5142:8204 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5142:8204 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n01:6279:8492 [3] NCCL INFO Connected all trees comm 0x2aecbc000ab0 nRanks 96 busId 63000 e08r2n18:751:3479 [0] NCCL INFO Connected all rings comm 0x2b8398000ab0 nRanks 96 busId 4000 e08r2n12:8671:11366 [0] NCCL INFO Connected all rings comm 0x2b6958000ab0 nRanks 96 busId 4000 e08r2n11:5730:8342 [0] NCCL INFO Connected all rings comm 0x2b7cc4000ab0 nRanks 96 busId 4000 e08r3n01:6279:8492 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n01:6279:8492 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23995:26735 [3] NCCL INFO Connected all rings comm 0x2b4d6c000ab0 nRanks 96 busId 63000 e08r3n08:13438:16173 [3] NCCL INFO Connected all trees comm 0x2b2878000ab0 nRanks 96 busId 63000 e08r3n11:29645:32290 [0] NCCL INFO Connected all rings comm 0x2ac49c000ab0 nRanks 96 busId 4000 e08r2n13:23995:26735 [3] NCCL INFO Channel 00 : 23[63000] -> 22[43000] via P2P/IPC comm 0x2b4d6c000ab0 nRanks 96 e08r2n08:5141:8206 [2] NCCL INFO Connected all trees comm 0x2b5e3c000ab0 nRanks 96 busId 43000 e08r3n08:13438:16173 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5141:8206 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5141:8206 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n08:13438:16173 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23995:26735 [3] NCCL INFO Channel 01 : 23[63000] -> 22[43000] via P2P/IPC comm 0x2b4d6c000ab0 nRanks 96 e08r2n17:21284:23952 [3] NCCL INFO Connected all rings comm 0x2ba784000ab0 nRanks 96 busId 63000 e08r3n10:18788:21518 [3] NCCL INFO Connected all trees comm 0x2adaac000ab0 nRanks 96 busId 63000 e08r2n17:21284:23952 [3] NCCL INFO Channel 00 : 39[63000] -> 38[43000] via P2P/IPC comm 0x2ba784000ab0 nRanks 96 e08r3n10:18788:21518 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n10:18788:21518 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27002:29647 [0] NCCL INFO Connected all rings comm 0x2b0f80000ab0 nRanks 96 busId 4000 e08r3n08:13434:16175 [0] NCCL INFO Connected all rings comm 0x2abf58000ab0 nRanks 96 busId 4000 e08r2n17:21284:23952 [3] NCCL INFO Channel 01 : 39[63000] -> 38[43000] via P2P/IPC comm 0x2ba784000ab0 nRanks 96 e08r2n10:876:3570 [3] NCCL INFO Connected all trees comm 0x2b2f70000ab0 nRanks 96 busId 63000 e08r2n10:876:3570 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n10:876:3570 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8675:11338 [0] NCCL INFO Connected all rings comm 0x2b43d0000ab0 nRanks 96 busId 4000 e08r2n13:23991:26733 [0] NCCL INFO Connected all rings comm 0x2b51f4000ab0 nRanks 96 busId 4000 e08r2n14:18192:20826 [0] NCCL INFO Connected all rings comm 0x2b8b18000ab0 nRanks 96 busId 4000 e08r2n10:872:3576 [0] NCCL INFO Connected all rings comm 0x2b62a4000ab0 nRanks 96 busId 4000 e08r2n13:23995:26735 [3] NCCL INFO Connected all trees comm 0x2b4d6c000ab0 nRanks 96 busId 63000 e08r2n13:23995:26735 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n13:23995:26735 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21284:23952 [3] NCCL INFO Connected all trees comm 0x2ba784000ab0 nRanks 96 busId 63000 e08r2n17:21284:23952 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n17:21284:23952 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n12:8675:11360 [3] NCCL INFO Connected all rings comm 0x2b3078000ab0 nRanks 96 busId 63000 e08r2n12:8675:11360 [3] NCCL INFO Channel 00 : 19[63000] -> 18[43000] via P2P/IPC comm 0x2b3078000ab0 nRanks 96 e08r2n09:27006:29649 [3] NCCL INFO Connected all rings comm 0x2b5948000ab0 nRanks 96 busId 63000 e08r2n09:27006:29649 [3] NCCL INFO Channel 00 : 7[63000] -> 6[43000] via P2P/IPC comm 0x2b5948000ab0 nRanks 96 e08r2n12:8675:11360 [3] NCCL INFO Channel 01 : 19[63000] -> 18[43000] via P2P/IPC comm 0x2b3078000ab0 nRanks 96 e08r2n09:27006:29649 [3] NCCL INFO Channel 01 : 7[63000] -> 6[43000] via P2P/IPC comm 0x2b5948000ab0 nRanks 96 e08r2n09:27006:29649 [3] NCCL INFO Connected all trees comm 0x2b5948000ab0 nRanks 96 busId 63000 e08r2n12:8675:11360 [3] NCCL INFO Connected all trees comm 0x2b3078000ab0 nRanks 96 busId 63000 e08r2n12:8675:11360 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n12:8675:11360 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27006:29649 [3] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n09:27006:29649 [3] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n16:13442:16162 [0] NCCL INFO Channel 01/0 : 32[4000] -> 36[4000] [send] via NET/IB/0 comm 0x2b4c88000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Channel 01/0 : 48[4000] -> 52[4000] [send] via NET/IB/0 comm 0x2ac0ac000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 00/0 : 40[4000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 00/0 : 24[4000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5f80000ab0 nRanks 96 e08r2n08:5136:8202 [0] NCCL INFO Channel 01/0 : 0[4000] -> 4[4000] [send] via NET/IB/0 comm 0x2b30a8000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 00/0 : 56[4000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4768000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 01/0 : 48[4000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b899c000ab0 nRanks 96 e08r3n04:16936:19068 [0] NCCL INFO Channel 01/0 : 64[4000] -> 68[4000] [send] via NET/IB/0 comm 0x2b37d8000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Channel 00/0 : 72[4000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aefdc000ab0 nRanks 96 e08r3n02:30401:32525 [0] NCCL INFO Channel 01/0 : 53[26000] -> 56[4000] [receive] via NET/IB/0 comm 0x2badc0000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 01/0 : 64[4000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b883c000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 01/0 : 69[26000] -> 72[4000] [receive] via NET/IB/0 comm 0x2afc48000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 01/0 : 85[26000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af26c000ab0 nRanks 96 e08r2n17:21280:23959 [0] NCCL INFO Channel 01/0 : 32[4000] -> 36[4000] [receive] via NET/IB/0 comm 0x2b01f0000ab0 nRanks 96 e08r2n18:751:3479 [0] NCCL INFO Channel 01/0 : 37[26000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8398000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 01/0 : 16[4000] -> 20[4000] [send] via NET/IB/0 comm 0x2b6958000ab0 nRanks 96 e08r3n11:29645:32290 [0] NCCL INFO Channel 00/0 : 88[4000] -> 92[4000] [receive] via NET/IB/0 comm 0x2ac49c000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 01/0 : 80[4000] -> 84[4000] [send] via NET/IB/0 comm 0x2abf58000ab0 nRanks 96 e08r2n11:5730:8342 [0] NCCL INFO Channel 00/0 : 8[4000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7cc4000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 01/0 : 0[4000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0f80000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 01/0 : 80[4000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b43d0000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 01/0 : 21[26000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b8b18000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 01/0 : 16[4000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b51f4000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Channel 01/0 : 5[26000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b62a4000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Channel 00/0 : 48[4000] -> 56[4000] [send] via NET/IB/0 comm 0x2ac0ac000ab0 nRanks 96 e08r3n04:16936:19068 [0] NCCL INFO Channel 00/0 : 64[4000] -> 80[4000] [send] via NET/IB/0 comm 0x2b37d8000ab0 nRanks 96 e08r3n05:24733:27396 [1] NCCL INFO Channel 01/0 : 72[4000] -> 69[26000] [receive] via NET/IB/0 comm 0x2abc38000ab0 nRanks 96 e08r3n09:8677:11336 [1] NCCL INFO Channel 01/0 : 88[4000] -> 85[26000] [receive] via NET/IB/0 comm 0x2b45a8000ab0 nRanks 96 e08r2n16:13442:16162 [0] NCCL INFO Channel 00/0 : 32[4000] -> 48[4000] [send] via NET/IB/0 comm 0x2b4c88000ab0 nRanks 96 e08r3n01:6277:8491 [1] NCCL INFO Channel 01/0 : 56[4000] -> 53[26000] [receive] via NET/IB/0 comm 0x2ba5b0000ab0 nRanks 96 e08r2n17:21282:23955 [1] NCCL INFO Channel 01/0 : 40[4000] -> 37[26000] [receive] via NET/IB/0 comm 0x2ac164000ab0 nRanks 96 e08r2n08:5136:8202 [0] NCCL INFO Channel 00/0 : 64[4000] -> 0[4000] [receive] via NET/IB/0 comm 0x2b30a8000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 00/0 : 68[4000] -> 73[26000] [send] via NET/IB/0 comm 0x2b883c000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 00/0 : 80[4000] -> 88[4000] [send] via NET/IB/0 comm 0x2abf58000ab0 nRanks 96 e08r2n17:21280:23959 [0] NCCL INFO Channel 00/0 : 36[4000] -> 41[26000] [send] via NET/IB/0 comm 0x2b01f0000ab0 nRanks 96 e08r2n13:23993:26732 [1] NCCL INFO Channel 01/0 : 24[4000] -> 21[26000] [receive] via NET/IB/0 comm 0x2b42c0000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 00/0 : 16[4000] -> 24[4000] [send] via NET/IB/0 comm 0x2b6958000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 00/0 : 88[4000] -> 92[4000] [send] via NET/IB/0 comm 0x2af26c000ab0 nRanks 96 e08r2n09:27004:29648 [1] NCCL INFO Channel 01/0 : 8[4000] -> 5[26000] [receive] via NET/IB/0 comm 0x2af944000ab0 nRanks 96 e08r3n02:30401:32525 [0] NCCL INFO Channel 00/0 : 56[4000] -> 60[4000] [send] via NET/IB/0 comm 0x2badc0000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 00/0 : 84[4000] -> 89[26000] [send] via NET/IB/0 comm 0x2b43d0000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 00/0 : 72[4000] -> 76[4000] [send] via NET/IB/0 comm 0x2afc48000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 00/0 : 52[4000] -> 57[26000] [send] via NET/IB/0 comm 0x2b899c000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 00/0 : 20[4000] -> 25[26000] [send] via NET/IB/0 comm 0x2b51f4000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 00/0 : 4[4000] -> 9[26000] [send] via NET/IB/0 comm 0x2b0f80000ab0 nRanks 96 e08r2n18:751:3479 [0] NCCL INFO Channel 00/0 : 40[4000] -> 44[4000] [send] via NET/IB/0 comm 0x2b8398000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 00/0 : 24[4000] -> 28[4000] [send] via NET/IB/0 comm 0x2b8b18000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Channel 00/0 : 8[4000] -> 12[4000] [send] via NET/IB/0 comm 0x2b62a4000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 01/0 : 68[4000] -> 76[4000] [send] via NET/IB/0 comm 0x2b883c000ab0 nRanks 96 e08r2n17:21280:23959 [0] NCCL INFO Channel 01/0 : 36[4000] -> 44[4000] [send] via NET/IB/0 comm 0x2b01f0000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 00/0 : 80[4000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af26c000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 00/0 : 72[4000] -> 81[26000] [send] via NET/IB/0 comm 0x2afc48000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 01/0 : 77[26000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b43d0000ab0 nRanks 96 e08r3n06:22283:25009 [1] NCCL INFO Channel 00/0 : 73[26000] -> 68[4000] [send] via NET/IB/0 comm 0x2b9cec000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 01/0 : 45[26000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b899c000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 01/0 : 4[4000] -> 12[4000] [send] via NET/IB/0 comm 0x2b0f80000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 01/0 : 13[26000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b51f4000ab0 nRanks 96 e08r2n18:751:3479 [0] NCCL INFO Channel 00/0 : 40[4000] -> 49[26000] [send] via NET/IB/0 comm 0x2b8398000ab0 nRanks 96 e08r2n18:753:3473 [1] NCCL INFO Channel 00/0 : 41[26000] -> 36[4000] [send] via NET/IB/0 comm 0x2b3358000ab0 nRanks 96 e08r3n10:18786:21523 [1] NCCL INFO Channel 00/0 : 89[26000] -> 84[4000] [send] via NET/IB/0 comm 0x2ac5c0000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 00/0 : 16[4000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b8b18000ab0 nRanks 96 e08r3n02:30403:32523 [1] NCCL INFO Channel 00/0 : 57[26000] -> 52[4000] [send] via NET/IB/0 comm 0x2ba378000ab0 nRanks 96 e08r3n02:30401:32525 [0] NCCL INFO Channel 00/0 : 48[4000] -> 56[4000] [receive] via NET/IB/0 comm 0x2badc0000ab0 nRanks 96 e08r2n14:18194:20823 [1] NCCL INFO Channel 00/0 : 25[26000] -> 20[4000] [send] via NET/IB/0 comm 0x2b4618000ab0 nRanks 96 e08r2n10:874:3574 [1] NCCL INFO Channel 00/0 : 9[26000] -> 4[4000] [send] via NET/IB/0 comm 0x2b20f0000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Channel 00/0 : 8[4000] -> 17[26000] [send] via NET/IB/0 comm 0x2b62a4000ab0 nRanks 96 e08r3n11:29645:32290 [0] NCCL INFO Channel 01/0 : 92[4000] -> 28[4000] [send] via NET/IB/0 comm 0x2ac49c000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Channel 01/0 : 68[4000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aefdc000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 01/0 : 44[4000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4768000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 01/0 : 36[4000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 01/0 : 12[4000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5f80000ab0 nRanks 96 e08r2n11:5730:8342 [0] NCCL INFO Channel 01/0 : 4[4000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7cc4000ab0 nRanks 96 e08r3n07:4891:7204 [1] NCCL INFO Channel 01/0 : 84[4000] -> 77[26000] [receive] via NET/IB/0 comm 0x2b7cf8000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 00/0 : 81[26000] -> 72[4000] [receive] via NET/IB/0 comm 0x2afc48000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 00/0 : 64[4000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abf58000ab0 nRanks 96 e08r2n19:9032:11812 [1] NCCL INFO Channel 01/0 : 52[4000] -> 45[26000] [receive] via NET/IB/0 comm 0x2af85c000ab0 nRanks 96 e08r2n18:751:3479 [0] NCCL INFO Channel 00/0 : 49[26000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8398000ab0 nRanks 96 e08r2n11:5732:8346 [1] NCCL INFO Channel 01/0 : 20[4000] -> 13[26000] [receive] via NET/IB/0 comm 0x2b1404000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 00/0 : 16[4000] -> 33[26000] [send] via NET/IB/0 comm 0x2b6958000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 01/0 : 76[4000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b883c000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 00/0 : 88[4000] -> 80[4000] [send] via NET/IB/0 comm 0x2af26c000ab0 nRanks 96 e08r3n08:13436:16169 [1] NCCL INFO Channel 00/0 : 81[26000] -> 72[4000] [send] via NET/IB/0 comm 0x2b1bb8000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Channel 00/0 : 32[4000] -> 48[4000] [receive] via NET/IB/0 comm 0x2ac0ac000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Channel 00/0 : 17[26000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b62a4000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 01/0 : 84[4000] -> 77[26000] [send] via NET/IB/0 comm 0x2b43d0000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 01/0 : 52[4000] -> 45[26000] [send] via NET/IB/0 comm 0x2b899c000ab0 nRanks 96 e08r3n00:14534:16703 [1] NCCL INFO Channel 00/0 : 49[26000] -> 40[4000] [send] via NET/IB/0 comm 0x2b8e34000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 01/0 : 20[4000] -> 13[26000] [send] via NET/IB/0 comm 0x2b51f4000ab0 nRanks 96 e08r2n17:21280:23959 [0] NCCL INFO Channel 01/0 : 44[4000] -> 36[4000] [receive] via NET/IB/0 comm 0x2b01f0000ab0 nRanks 96 e08r2n12:8673:11362 [1] NCCL INFO Channel 00/0 : 17[26000] -> 8[4000] [send] via NET/IB/0 comm 0x2b951c000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Channel 01/0 : 61[26000] -> 76[4000] [receive] via NET/IB/0 comm 0x2aefdc000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 00/0 : 24[4000] -> 16[4000] [send] via NET/IB/0 comm 0x2b8b18000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 01/0 : 44[4000] -> 60[4000] [send] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r3n02:30401:32525 [0] NCCL INFO Channel 00/0 : 56[4000] -> 48[4000] [send] via NET/IB/0 comm 0x2badc0000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 01/0 : 12[4000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0f80000ab0 nRanks 96 e08r2n11:5730:8342 [0] NCCL INFO Channel 01/0 : 12[4000] -> 28[4000] [send] via NET/IB/0 comm 0x2b7cc4000ab0 nRanks 96 e08r3n08:13436:16169 [1] NCCL INFO Channel 00 : 81[26000] -> 80[4000] via P2P/IPC comm 0x2b1bb8000ab0 nRanks 96 e08r3n08:13436:16169 [1] NCCL INFO Channel 01 : 81[26000] -> 80[4000] via P2P/IPC comm 0x2b1bb8000ab0 nRanks 96 e08r2n12:8673:11362 [1] NCCL INFO Channel 00 : 17[26000] -> 16[4000] via P2P/IPC comm 0x2b951c000ab0 nRanks 96 e08r3n00:14534:16703 [1] NCCL INFO Channel 00 : 49[26000] -> 48[4000] via P2P/IPC comm 0x2b8e34000ab0 nRanks 96 e08r3n00:14534:16703 [1] NCCL INFO Channel 01 : 49[26000] -> 48[4000] via P2P/IPC comm 0x2b8e34000ab0 nRanks 96 e08r2n12:8673:11362 [1] NCCL INFO Channel 01 : 17[26000] -> 16[4000] via P2P/IPC comm 0x2b951c000ab0 nRanks 96 e08r3n08:13437:16171 [2] NCCL INFO Connected all trees comm 0x2b919c000ab0 nRanks 96 busId 43000 e08r3n08:13437:16171 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n08:13437:16171 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14535:16698 [2] NCCL INFO Connected all trees comm 0x2bb1cc000ab0 nRanks 96 busId 43000 e08r3n00:14535:16698 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n12:8674:11365 [2] NCCL INFO Connected all trees comm 0x2b6804000ab0 nRanks 96 busId 43000 e08r3n00:14535:16698 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n12:8674:11365 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n12:8674:11365 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n19:9032:11812 [1] NCCL INFO Channel 00 : 45[26000] -> 44[4000] via P2P/IPC comm 0x2af85c000ab0 nRanks 96 e08r2n19:9032:11812 [1] NCCL INFO Channel 01 : 45[26000] -> 44[4000] via P2P/IPC comm 0x2af85c000ab0 nRanks 96 e08r2n11:5732:8346 [1] NCCL INFO Channel 00 : 13[26000] -> 12[4000] via P2P/IPC comm 0x2b1404000ab0 nRanks 96 e08r2n11:5732:8346 [1] NCCL INFO Channel 01 : 13[26000] -> 12[4000] via P2P/IPC comm 0x2b1404000ab0 nRanks 96 e08r3n07:4891:7204 [1] NCCL INFO Channel 00 : 77[26000] -> 76[4000] via P2P/IPC comm 0x2b7cf8000ab0 nRanks 96 e08r3n07:4891:7204 [1] NCCL INFO Channel 01 : 77[26000] -> 76[4000] via P2P/IPC comm 0x2b7cf8000ab0 nRanks 96 e08r2n19:9033:11810 [2] NCCL INFO Connected all trees comm 0x2b0610000ab0 nRanks 96 busId 43000 e08r2n19:9033:11810 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5733:8341 [2] NCCL INFO Connected all trees comm 0x2ae954000ab0 nRanks 96 busId 43000 e08r2n19:9033:11810 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5733:8341 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5733:8341 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n07:4892:7207 [2] NCCL INFO Connected all trees comm 0x2b98d4000ab0 nRanks 96 busId 43000 e08r3n07:4892:7207 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n07:4892:7207 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n04:16936:19068 [0] NCCL INFO Channel 00/0 : 64[4000] -> 0[4000] [send] via NET/IB/0 comm 0x2b37d8000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 00/0 : 33[26000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b6958000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 00/0 : 89[26000] -> 84[4000] [receive] via NET/IB/0 comm 0x2b43d0000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 00/0 : 80[4000] -> 64[4000] [send] via NET/IB/0 comm 0x2abf58000ab0 nRanks 96 e08r2n16:13442:16162 [0] NCCL INFO Channel 00/0 : 32[4000] -> 65[26000] [send] via NET/IB/0 comm 0x2b4c88000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 00/0 : 57[26000] -> 52[4000] [receive] via NET/IB/0 comm 0x2b899c000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 00/0 : 25[26000] -> 20[4000] [receive] via NET/IB/0 comm 0x2b51f4000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Channel 00/0 : 48[4000] -> 32[4000] [send] via NET/IB/0 comm 0x2ac0ac000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 00/0 : 76[4000] -> 72[4000] [receive] via NET/IB/0 comm 0x2afc48000ab0 nRanks 96 e08r3n03:22737:25417 [1] NCCL INFO Channel 01/0 : 76[4000] -> 61[26000] [receive] via NET/IB/0 comm 0x2ac904000ab0 nRanks 96 e08r2n16:13444:16165 [1] NCCL INFO Channel 00/0 : 33[26000] -> 16[4000] [send] via NET/IB/0 comm 0x2b03e8000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 01/0 : 60[4000] -> 44[4000] [receive] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r2n18:751:3479 [0] NCCL INFO Channel 00/0 : 44[4000] -> 40[4000] [receive] via NET/IB/0 comm 0x2b8398000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Channel 00/0 : 12[4000] -> 8[4000] [receive] via NET/IB/0 comm 0x2b62a4000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Channel 01/0 : 76[4000] -> 61[26000] [send] via NET/IB/0 comm 0x2aefdc000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 01/0 : 29[26000] -> 60[4000] [receive] via NET/IB/0 comm 0x2b4768000ab0 nRanks 96 e08r2n11:5730:8342 [0] NCCL INFO Channel 01/0 : 28[4000] -> 12[4000] [receive] via NET/IB/0 comm 0x2b7cc4000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 01/0 : 92[4000] -> 28[4000] [receive] via NET/IB/0 comm 0x2b5f80000ab0 nRanks 96 e08r3n10:18786:21523 [1] NCCL INFO Channel 00 : 89[26000] -> 88[4000] via P2P/IPC comm 0x2ac5c0000ab0 nRanks 96 e08r3n10:18786:21523 [1] NCCL INFO Channel 01 : 89[26000] -> 88[4000] via P2P/IPC comm 0x2ac5c0000ab0 nRanks 96 e08r3n02:30403:32523 [1] NCCL INFO Channel 00 : 57[26000] -> 56[4000] via P2P/IPC comm 0x2ba378000ab0 nRanks 96 e08r2n14:18194:20823 [1] NCCL INFO Channel 00 : 25[26000] -> 24[4000] via P2P/IPC comm 0x2b4618000ab0 nRanks 96 e08r3n02:30403:32523 [1] NCCL INFO Channel 01 : 57[26000] -> 56[4000] via P2P/IPC comm 0x2ba378000ab0 nRanks 96 e08r2n14:18194:20823 [1] NCCL INFO Channel 01 : 25[26000] -> 24[4000] via P2P/IPC comm 0x2b4618000ab0 nRanks 96 e08r2n16:13444:16165 [1] NCCL INFO Channel 00 : 33[26000] -> 32[4000] via P2P/IPC comm 0x2b03e8000ab0 nRanks 96 e08r2n16:13444:16165 [1] NCCL INFO Channel 01 : 33[26000] -> 32[4000] via P2P/IPC comm 0x2b03e8000ab0 nRanks 96 e08r3n10:18787:21519 [2] NCCL INFO Connected all trees comm 0x2ae928000ab0 nRanks 96 busId 43000 e08r3n10:18787:21519 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n10:18787:21519 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30404:32518 [2] NCCL INFO Connected all trees comm 0x2b6a10000ab0 nRanks 96 busId 43000 e08r3n02:30404:32518 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n02:30404:32518 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n14:18195:20820 [2] NCCL INFO Connected all trees comm 0x2b7728000ab0 nRanks 96 busId 43000 e08r2n14:18195:20820 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n14:18195:20820 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n16:13445:16161 [2] NCCL INFO Connected all trees comm 0x2b6a48000ab0 nRanks 96 busId 43000 e08r2n16:13445:16161 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n16:13445:16161 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n03:22737:25417 [1] NCCL INFO Channel 00 : 61[26000] -> 60[4000] via P2P/IPC comm 0x2ac904000ab0 nRanks 96 e08r3n03:22737:25417 [1] NCCL INFO Channel 01 : 61[26000] -> 60[4000] via P2P/IPC comm 0x2ac904000ab0 nRanks 96 e08r3n03:22738:25418 [2] NCCL INFO Connected all trees comm 0x2af6a0000ab0 nRanks 96 busId 43000 e08r3n03:22738:25418 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n03:22738:25418 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n16:13442:16162 [0] NCCL INFO Channel 00/0 : 65[26000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4c88000ab0 nRanks 96 e08r3n04:16938:19062 [1] NCCL INFO Channel 00/0 : 65[26000] -> 32[4000] [send] via NET/IB/0 comm 0x2b0ddc000ab0 nRanks 96 e08r2n08:5136:8202 [0] NCCL INFO Channel 00/0 : 0[4000] -> 64[4000] [send] via NET/IB/0 comm 0x2b30a8000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Channel 01/0 : 76[4000] -> 68[4000] [send] via NET/IB/0 comm 0x2aefdc000ab0 nRanks 96 e08r3n04:16936:19068 [0] NCCL INFO Channel 00/0 : 0[4000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b37d8000ab0 nRanks 96 e08r3n09:8675:11338 [0] NCCL INFO Channel 01/0 : 84[4000] -> 80[4000] [send] via NET/IB/0 comm 0x2b43d0000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Channel 01/0 : 52[4000] -> 48[4000] [send] via NET/IB/0 comm 0x2b899c000ab0 nRanks 96 e08r2n13:23991:26733 [0] NCCL INFO Channel 01/0 : 20[4000] -> 16[4000] [send] via NET/IB/0 comm 0x2b51f4000ab0 nRanks 96 e08r2n15:22023:24652 [1] NCCL INFO Channel 01/0 : 60[4000] -> 29[26000] [receive] via NET/IB/0 comm 0x2ad720000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 00/0 : 24[4000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b6958000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 01/0 : 60[4000] -> 29[26000] [send] via NET/IB/0 comm 0x2b4768000ab0 nRanks 96 e08r3n11:29645:32290 [0] NCCL INFO Channel 01/0 : 28[4000] -> 92[4000] [receive] via NET/IB/0 comm 0x2ac49c000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 01/0 : 28[4000] -> 92[4000] [send] via NET/IB/0 comm 0x2b5f80000ab0 nRanks 96 e08r3n04:16938:19062 [1] NCCL INFO Channel 00 : 65[26000] -> 64[4000] via P2P/IPC comm 0x2b0ddc000ab0 nRanks 96 e08r3n04:16938:19062 [1] NCCL INFO Channel 01 : 65[26000] -> 64[4000] via P2P/IPC comm 0x2b0ddc000ab0 nRanks 96 e08r3n04:16939:19064 [2] NCCL INFO Connected all trees comm 0x2b5118000ab0 nRanks 96 busId 43000 e08r3n04:16939:19064 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n04:16939:19064 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n15:22023:24652 [1] NCCL INFO Channel 00 : 29[26000] -> 28[4000] via P2P/IPC comm 0x2ad720000ab0 nRanks 96 e08r2n15:22023:24652 [1] NCCL INFO Channel 01 : 29[26000] -> 28[4000] via P2P/IPC comm 0x2ad720000ab0 nRanks 96 e08r2n15:22024:24654 [2] NCCL INFO Connected all trees comm 0x2b14a0000ab0 nRanks 96 busId 43000 e08r2n15:22024:24654 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n15:22024:24654 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n07:4889:7203 [0] NCCL INFO Channel 00/0 : 76[4000] -> 72[4000] [send] via NET/IB/0 comm 0x2aefdc000ab0 nRanks 96 e08r2n08:5136:8202 [0] NCCL INFO Channel 01/0 : 4[4000] -> 0[4000] [receive] via NET/IB/0 comm 0x2b30a8000ab0 nRanks 96 e08r2n16:13442:16162 [0] NCCL INFO Channel 00/0 : 48[4000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4c88000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 00/0 : 28[4000] -> 24[4000] [receive] via NET/IB/0 comm 0x2b8b18000ab0 nRanks 96 e08r3n04:16936:19068 [0] NCCL INFO Channel 00/0 : 80[4000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b37d8000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 01/0 : 60[4000] -> 44[4000] [send] via NET/IB/0 comm 0x2b4768000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO Channel 01/0 : 20[4000] -> 16[4000] [receive] via NET/IB/0 comm 0x2b6958000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 00/0 : 73[26000] -> 68[4000] [receive] via NET/IB/0 comm 0x2b883c000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 01/0 : 28[4000] -> 12[4000] [send] via NET/IB/0 comm 0x2b5f80000ab0 nRanks 96 e08r3n11:29645:32290 [0] NCCL INFO Channel 00/0 : 92[4000] -> 88[4000] [send] via NET/IB/0 comm 0x2ac49c000ab0 nRanks 96 e08r3n07:4889:7203 [0] NCCL INFO Connected all trees comm 0x2aefdc000ab0 nRanks 96 busId 4000 e08r3n07:4889:7203 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n07:4889:7203 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n07:4891:7204 [1] NCCL INFO Connected all trees comm 0x2b7cf8000ab0 nRanks 96 busId 26000 e08r3n07:4891:7204 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n07:4891:7204 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n06:22283:25009 [1] NCCL INFO Channel 00 : 73[26000] -> 72[4000] via P2P/IPC comm 0x2b9cec000ab0 nRanks 96 e08r3n06:22283:25009 [1] NCCL INFO Channel 01 : 73[26000] -> 72[4000] via P2P/IPC comm 0x2b9cec000ab0 nRanks 96 e08r3n06:22284:25008 [2] NCCL INFO Connected all trees comm 0x2b15fc000ab0 nRanks 96 busId 43000 e08r3n06:22284:25008 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22284:25008 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n12:8671:11366 [0] NCCL INFO Connected all trees comm 0x2b6958000ab0 nRanks 96 busId 4000 e08r2n12:8671:11366 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n12:8671:11366 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n12:8673:11362 [1] NCCL INFO Connected all trees comm 0x2b951c000ab0 nRanks 96 busId 26000 e08r2n12:8673:11362 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n12:8673:11362 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14532:16701 [0] NCCL INFO Channel 00/0 : 56[4000] -> 48[4000] [receive] via NET/IB/0 comm 0x2ac0ac000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Channel 01/0 : 72[4000] -> 69[26000] [send] via NET/IB/0 comm 0x2afc48000ab0 nRanks 96 e08r3n03:22735:25423 [0] NCCL INFO Channel 00/0 : 60[4000] -> 56[4000] [send] via NET/IB/0 comm 0x2b4768000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 00/0 : 88[4000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abf58000ab0 nRanks 96 e08r2n16:13442:16162 [0] NCCL INFO Channel 01/0 : 36[4000] -> 32[4000] [receive] via NET/IB/0 comm 0x2b4c88000ab0 nRanks 96 e08r3n04:16936:19068 [0] NCCL INFO Channel 01/0 : 68[4000] -> 64[4000] [receive] via NET/IB/0 comm 0x2b37d8000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Channel 00/0 : 28[4000] -> 24[4000] [send] via NET/IB/0 comm 0x2b5f80000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 01/0 : 44[4000] -> 36[4000] [send] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r3n05:24731:27398 [0] NCCL INFO Channel 01/0 : 68[4000] -> 64[4000] [send] via NET/IB/0 comm 0x2b883c000ab0 nRanks 96 e08r2n11:5730:8342 [0] NCCL INFO Channel 01/0 : 12[4000] -> 4[4000] [send] via NET/IB/0 comm 0x2b7cc4000ab0 nRanks 96 e08r3n06:22281:25013 [0] NCCL INFO Connected all trees comm 0x2afc48000ab0 nRanks 96 busId 4000 e08r3n06:22281:25013 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22281:25013 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n06:22283:25009 [1] NCCL INFO Connected all trees comm 0x2b9cec000ab0 nRanks 96 busId 26000 e08r3n06:22283:25009 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n06:22283:25009 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n05:24733:27396 [1] NCCL INFO Channel 00 : 69[26000] -> 68[4000] via P2P/IPC comm 0x2abc38000ab0 nRanks 96 e08r3n05:24733:27396 [1] NCCL INFO Channel 01 : 69[26000] -> 68[4000] via P2P/IPC comm 0x2abc38000ab0 nRanks 96 e08r2n15:22021:24653 [0] NCCL INFO Connected all trees comm 0x2b5f80000ab0 nRanks 96 busId 4000 e08r2n15:22021:24653 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n05:24734:27392 [2] NCCL INFO Connected all trees comm 0x2b2914000ab0 nRanks 96 busId 43000 e08r2n15:22021:24653 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n05:24734:27392 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n05:24734:27392 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n15:22023:24652 [1] NCCL INFO Connected all trees comm 0x2ad720000ab0 nRanks 96 busId 26000 e08r2n15:22023:24652 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n15:22023:24652 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n05:24731:27398 [0] NCCL INFO Connected all trees comm 0x2b883c000ab0 nRanks 96 busId 4000 e08r3n05:24731:27398 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n05:24731:27398 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n05:24733:27396 [1] NCCL INFO Connected all trees comm 0x2abc38000ab0 nRanks 96 busId 26000 e08r3n05:24733:27396 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n05:24733:27396 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n04:16936:19068 [0] NCCL INFO Connected all trees comm 0x2b37d8000ab0 nRanks 96 busId 4000 e08r3n04:16936:19068 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n04:16936:19068 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n04:16938:19062 [1] NCCL INFO Connected all trees comm 0x2b0ddc000ab0 nRanks 96 busId 26000 e08r3n04:16938:19062 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n04:16938:19062 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30401:32525 [0] NCCL INFO Channel 00/0 : 60[4000] -> 56[4000] [receive] via NET/IB/0 comm 0x2badc0000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 00/0 : 92[4000] -> 88[4000] [receive] via NET/IB/0 comm 0x2af26c000ab0 nRanks 96 e08r3n00:14532:16701 [0] NCCL INFO Channel 01/0 : 52[4000] -> 48[4000] [receive] via NET/IB/0 comm 0x2ac0ac000ab0 nRanks 96 e08r3n08:13434:16175 [0] NCCL INFO Channel 01/0 : 84[4000] -> 80[4000] [receive] via NET/IB/0 comm 0x2abf58000ab0 nRanks 96 e08r2n19:9030:11813 [0] NCCL INFO Channel 00/0 : 44[4000] -> 40[4000] [send] via NET/IB/0 comm 0x2ab5e8000ab0 nRanks 96 e08r3n07:4892:7207 [2] NCCL INFO comm 0x2b98d4000ab0 rank 78 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n07:4891:7204 [1] NCCL INFO comm 0x2b7cf8000ab0 rank 77 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n11:5730:8342 [0] NCCL INFO Channel 00/0 : 12[4000] -> 8[4000] [send] via NET/IB/0 comm 0x2b7cc4000ab0 nRanks 96 e08r2n14:18192:20826 [0] NCCL INFO Channel 01/0 : 24[4000] -> 21[26000] [send] via NET/IB/0 comm 0x2b8b18000ab0 nRanks 96 e08r2n17:21280:23959 [0] NCCL INFO Channel 00/0 : 41[26000] -> 36[4000] [receive] via NET/IB/0 comm 0x2b01f0000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 00/0 : 9[26000] -> 4[4000] [receive] via NET/IB/0 comm 0x2b0f80000ab0 nRanks 96 e08r2n12:8671:11366 [0] NCCL INFO comm 0x2b6958000ab0 rank 16 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n12:8674:11365 [2] NCCL INFO comm 0x2b6804000ab0 rank 18 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n12:8675:11360 [3] NCCL INFO comm 0x2b3078000ab0 rank 19 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n12:8673:11362 [1] NCCL INFO comm 0x2b951c000ab0 rank 17 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n07:4893:7208 [3] NCCL INFO comm 0x2ba900000ab0 rank 79 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n07:4889:7203 [0] NCCL INFO comm 0x2aefdc000ab0 rank 76 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n03:22735:25423 [0] NCCL INFO Connected all trees comm 0x2b4768000ab0 nRanks 96 busId 4000 e08r3n03:22735:25423 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n03:22735:25423 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n03:22737:25417 [1] NCCL INFO Connected all trees comm 0x2ac904000ab0 nRanks 96 busId 26000 e08r3n03:22737:25417 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n03:22737:25417 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n11:29645:32290 [0] NCCL INFO Connected all trees comm 0x2ac49c000ab0 nRanks 96 busId 4000 e08r3n11:29645:32290 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n11:29645:32290 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n11:29647:32289 [1] NCCL INFO Connected all trees comm 0x2abf74000ab0 nRanks 96 busId 26000 e08r3n11:29647:32289 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n11:29647:32289 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n19:9030:11813 [0] NCCL INFO Connected all trees comm 0x2ab5e8000ab0 nRanks 96 busId 4000 e08r2n19:9030:11813 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n19:9030:11813 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n19:9032:11812 [1] NCCL INFO Connected all trees comm 0x2af85c000ab0 nRanks 96 busId 26000 e08r2n19:9032:11812 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n19:9032:11812 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14532:16701 [0] NCCL INFO Connected all trees comm 0x2ac0ac000ab0 nRanks 96 busId 4000 e08r3n00:14532:16701 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n00:14532:16701 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n00:14534:16703 [1] NCCL INFO Connected all trees comm 0x2b8e34000ab0 nRanks 96 busId 26000 e08r3n00:14534:16703 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5730:8342 [0] NCCL INFO Connected all trees comm 0x2b7cc4000ab0 nRanks 96 busId 4000 e08r3n00:14534:16703 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5730:8342 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n11:5730:8342 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n11:5732:8346 [1] NCCL INFO Connected all trees comm 0x2b1404000ab0 nRanks 96 busId 26000 e08r2n11:5732:8346 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n14:18192:20826 [0] NCCL INFO Connected all trees comm 0x2b8b18000ab0 nRanks 96 busId 4000 e08r2n11:5732:8346 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n14:18192:20826 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n14:18192:20826 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n08:13434:16175 [0] NCCL INFO Connected all trees comm 0x2abf58000ab0 nRanks 96 busId 4000 e08r3n08:13434:16175 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n08:13434:16175 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n14:18194:20823 [1] NCCL INFO Connected all trees comm 0x2b4618000ab0 nRanks 96 busId 26000 e08r2n14:18194:20823 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n08:13436:16169 [1] NCCL INFO Connected all trees comm 0x2b1bb8000ab0 nRanks 96 busId 26000 e08r2n14:18194:20823 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n08:13436:16169 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n08:13436:16169 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n18:753:3473 [1] NCCL INFO Channel 00 : 41[26000] -> 40[4000] via P2P/IPC comm 0x2b3358000ab0 nRanks 96 e08r2n18:753:3473 [1] NCCL INFO Channel 01 : 41[26000] -> 40[4000] via P2P/IPC comm 0x2b3358000ab0 nRanks 96 e08r2n10:874:3574 [1] NCCL INFO Channel 00 : 9[26000] -> 8[4000] via P2P/IPC comm 0x2b20f0000ab0 nRanks 96 e08r2n13:23993:26732 [1] NCCL INFO Channel 00 : 21[26000] -> 20[4000] via P2P/IPC comm 0x2b42c0000ab0 nRanks 96 e08r2n13:23993:26732 [1] NCCL INFO Channel 01 : 21[26000] -> 20[4000] via P2P/IPC comm 0x2b42c0000ab0 nRanks 96 e08r2n10:874:3574 [1] NCCL INFO Channel 01 : 9[26000] -> 8[4000] via P2P/IPC comm 0x2b20f0000ab0 nRanks 96 e08r2n18:754:3475 [2] NCCL INFO Connected all trees comm 0x2b2c8c000ab0 nRanks 96 busId 43000 e08r2n18:754:3475 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n18:754:3475 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23991:26733 [0] NCCL INFO Connected all trees comm 0x2b51f4000ab0 nRanks 96 busId 4000 e08r2n13:23991:26733 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n13:23991:26733 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n10:875:3571 [2] NCCL INFO Connected all trees comm 0x2afb28000ab0 nRanks 96 busId 43000 e08r2n10:875:3571 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n10:875:3571 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23993:26732 [1] NCCL INFO Connected all trees comm 0x2b42c0000ab0 nRanks 96 busId 26000 e08r2n13:23993:26732 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n13:23993:26732 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n13:23994:26734 [2] NCCL INFO Connected all trees comm 0x2b5ff4000ab0 nRanks 96 busId 43000 e08r2n13:23994:26734 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n13:23994:26734 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30401:32525 [0] NCCL INFO Channel 01/0 : 56[4000] -> 53[26000] [send] via NET/IB/0 comm 0x2badc0000ab0 nRanks 96 e08r3n10:18784:21522 [0] NCCL INFO Channel 01/0 : 88[4000] -> 85[26000] [send] via NET/IB/0 comm 0x2af26c000ab0 nRanks 96 e08r3n06:22284:25008 [2] NCCL INFO comm 0x2b15fc000ab0 rank 74 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n06:22281:25013 [0] NCCL INFO comm 0x2afc48000ab0 rank 72 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n18:751:3479 [0] NCCL INFO Channel 01/0 : 40[4000] -> 37[26000] [send] via NET/IB/0 comm 0x2b8398000ab0 nRanks 96 e08r3n06:22285:25007 [3] NCCL INFO comm 0x2b9418000ab0 rank 75 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n06:22283:25009 [1] NCCL INFO comm 0x2b9cec000ab0 rank 73 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n10:872:3576 [0] NCCL INFO Channel 01/0 : 8[4000] -> 5[26000] [send] via NET/IB/0 comm 0x2b62a4000ab0 nRanks 96 e08r2n17:21280:23959 [0] NCCL INFO Channel 01/0 : 36[4000] -> 32[4000] [send] via NET/IB/0 comm 0x2b01f0000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Channel 01/0 : 4[4000] -> 0[4000] [send] via NET/IB/0 comm 0x2b0f80000ab0 nRanks 96 e08r2n15:22023:24652 [1] NCCL INFO comm 0x2ad720000ab0 rank 29 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n04:16936:19068 [0] NCCL INFO comm 0x2b37d8000ab0 rank 64 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n04:16939:19064 [2] NCCL INFO comm 0x2b5118000ab0 rank 66 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n04:16940:19060 [3] NCCL INFO comm 0x2b208c000ab0 rank 67 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n04:16938:19062 [1] NCCL INFO comm 0x2b0ddc000ab0 rank 65 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n15:22024:24654 [2] NCCL INFO comm 0x2b14a0000ab0 rank 30 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n15:22021:24653 [0] NCCL INFO comm 0x2b5f80000ab0 rank 28 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n15:22025:24655 [3] NCCL INFO comm 0x2b3468000ab0 rank 31 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n05:24735:27390 [3] NCCL INFO comm 0x2ac47c000ab0 rank 71 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n05:24733:27396 [1] NCCL INFO comm 0x2abc38000ab0 rank 69 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n05:24734:27392 [2] NCCL INFO comm 0x2b2914000ab0 rank 70 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n05:24731:27398 [0] NCCL INFO comm 0x2b883c000ab0 rank 68 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n02:30401:32525 [0] NCCL INFO Connected all trees comm 0x2badc0000ab0 nRanks 96 busId 4000 e08r3n02:30401:32525 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n02:30401:32525 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n02:30403:32523 [1] NCCL INFO Connected all trees comm 0x2ba378000ab0 nRanks 96 busId 26000 e08r3n02:30403:32523 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n02:30403:32523 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n10:18784:21522 [0] NCCL INFO Connected all trees comm 0x2af26c000ab0 nRanks 96 busId 4000 e08r3n10:18784:21522 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n10:18784:21522 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n01:6277:8491 [1] NCCL INFO Channel 00 : 53[26000] -> 52[4000] via P2P/IPC comm 0x2ba5b0000ab0 nRanks 96 e08r3n10:18786:21523 [1] NCCL INFO Connected all trees comm 0x2ac5c0000ab0 nRanks 96 busId 26000 e08r3n10:18786:21523 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n10:18786:21523 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n01:6277:8491 [1] NCCL INFO Channel 01 : 53[26000] -> 52[4000] via P2P/IPC comm 0x2ba5b0000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO Connected all trees comm 0x2b899c000ab0 nRanks 96 busId 4000 e08r3n09:8677:11336 [1] NCCL INFO Channel 00 : 85[26000] -> 84[4000] via P2P/IPC comm 0x2b45a8000ab0 nRanks 96 e08r3n01:6275:8490 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n01:6275:8490 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8677:11336 [1] NCCL INFO Channel 01 : 85[26000] -> 84[4000] via P2P/IPC comm 0x2b45a8000ab0 nRanks 96 e08r3n01:6278:8493 [2] NCCL INFO Connected all trees comm 0x2b1280000ab0 nRanks 96 busId 43000 e08r3n01:6277:8491 [1] NCCL INFO Connected all trees comm 0x2ba5b0000ab0 nRanks 96 busId 26000 e08r3n01:6278:8493 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n01:6278:8493 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n01:6277:8491 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n01:6277:8491 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8675:11338 [0] NCCL INFO Connected all trees comm 0x2b43d0000ab0 nRanks 96 busId 4000 e08r3n09:8675:11338 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n09:8675:11338 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8677:11336 [1] NCCL INFO Connected all trees comm 0x2b45a8000ab0 nRanks 96 busId 26000 e08r3n09:8677:11336 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n09:8677:11336 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n09:8678:11333 [2] NCCL INFO Connected all trees comm 0x2b235c000ab0 nRanks 96 busId 43000 e08r3n09:8678:11333 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r3n09:8678:11333 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n18:751:3479 [0] NCCL INFO Connected all trees comm 0x2b8398000ab0 nRanks 96 busId 4000 e08r2n18:751:3479 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n18:751:3479 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n18:753:3473 [1] NCCL INFO Connected all trees comm 0x2b3358000ab0 nRanks 96 busId 26000 e08r2n18:753:3473 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n18:753:3473 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21282:23955 [1] NCCL INFO Channel 00 : 37[26000] -> 36[4000] via P2P/IPC comm 0x2ac164000ab0 nRanks 96 e08r2n17:21282:23955 [1] NCCL INFO Channel 01 : 37[26000] -> 36[4000] via P2P/IPC comm 0x2ac164000ab0 nRanks 96 e08r2n10:872:3576 [0] NCCL INFO Connected all trees comm 0x2b62a4000ab0 nRanks 96 busId 4000 e08r2n10:872:3576 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n10:872:3576 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n10:874:3574 [1] NCCL INFO Connected all trees comm 0x2b20f0000ab0 nRanks 96 busId 26000 e08r2n10:874:3574 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n10:874:3574 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21280:23959 [0] NCCL INFO Connected all trees comm 0x2b01f0000ab0 nRanks 96 busId 4000 e08r2n17:21280:23959 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n17:21280:23959 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21282:23955 [1] NCCL INFO Connected all trees comm 0x2ac164000ab0 nRanks 96 busId 26000 e08r2n09:27004:29648 [1] NCCL INFO Channel 00 : 5[26000] -> 4[4000] via P2P/IPC comm 0x2af944000ab0 nRanks 96 e08r2n17:21282:23955 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n17:21282:23955 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n17:21283:23951 [2] NCCL INFO Connected all trees comm 0x2b9988000ab0 nRanks 96 busId 43000 e08r2n17:21283:23951 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n17:21283:23951 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27004:29648 [1] NCCL INFO Channel 01 : 5[26000] -> 4[4000] via P2P/IPC comm 0x2af944000ab0 nRanks 96 e08r2n09:27002:29647 [0] NCCL INFO Connected all trees comm 0x2b0f80000ab0 nRanks 96 busId 4000 e08r2n09:27002:29647 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n09:27002:29647 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27005:29650 [2] NCCL INFO Connected all trees comm 0x2b40ac000ab0 nRanks 96 busId 43000 e08r2n09:27004:29648 [1] NCCL INFO Connected all trees comm 0x2af944000ab0 nRanks 96 busId 26000 e08r2n09:27004:29648 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n09:27004:29648 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n09:27005:29650 [2] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n09:27005:29650 [2] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n16:13442:16162 [0] NCCL INFO Connected all trees comm 0x2b4c88000ab0 nRanks 96 busId 4000 e08r2n16:13442:16162 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n16:13442:16162 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n16:13444:16165 [1] NCCL INFO Connected all trees comm 0x2b03e8000ab0 nRanks 96 busId 26000 e08r2n16:13444:16165 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n16:13444:16165 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n08:5136:8202 [0] NCCL INFO Connected all trees comm 0x2b30a8000ab0 nRanks 96 busId 4000 e08r2n08:5136:8202 [0] NCCL INFO Using tuning table 0 with LL128 disabled e08r2n08:5136:8202 [0] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5136:8202 [0] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r2n08:5140:8208 [1] NCCL INFO Connected all trees comm 0x2b3330000ab0 nRanks 96 busId 26000 e08r2n08:5140:8208 [1] NCCL INFO threadThresholds 8/8/64 | 768/8/64 | 8/8/256 e08r2n08:5140:8208 [1] NCCL INFO 2 coll channels, 2 p2p channels, 1 p2p channels per peer e08r3n03:22735:25423 [0] NCCL INFO comm 0x2b4768000ab0 rank 60 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n03:22738:25418 [2] NCCL INFO comm 0x2af6a0000ab0 rank 62 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n03:22739:25421 [3] NCCL INFO comm 0x2b0784000ab0 rank 63 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n03:22737:25417 [1] NCCL INFO comm 0x2ac904000ab0 rank 61 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n11:29648:32286 [2] NCCL INFO comm 0x2b900c000ab0 rank 94 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n11:29649:32285 [3] NCCL INFO comm 0x2ba94c000ab0 rank 95 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n11:29647:32289 [1] NCCL INFO comm 0x2abf74000ab0 rank 93 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n19:9032:11812 [1] NCCL INFO comm 0x2af85c000ab0 rank 45 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n11:5733:8341 [2] NCCL INFO comm 0x2ae954000ab0 rank 14 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n14:18195:20820 [2] NCCL INFO comm 0x2b7728000ab0 rank 26 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n14:18194:20823 [1] NCCL INFO comm 0x2b4618000ab0 rank 25 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n08:13438:16173 [3] NCCL INFO comm 0x2b2878000ab0 rank 83 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n08:13436:16169 [1] NCCL INFO comm 0x2b1bb8000ab0 rank 81 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n11:5732:8346 [1] NCCL INFO comm 0x2b1404000ab0 rank 13 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n11:29645:32290 [0] NCCL INFO comm 0x2ac49c000ab0 rank 92 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n13:23995:26735 [3] NCCL INFO comm 0x2b4d6c000ab0 rank 23 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n13:23991:26733 [0] NCCL INFO comm 0x2b51f4000ab0 rank 20 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n13:23994:26734 [2] NCCL INFO comm 0x2b5ff4000ab0 rank 22 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n19:9033:11810 [2] NCCL INFO comm 0x2b0610000ab0 rank 46 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n19:9030:11813 [0] NCCL INFO comm 0x2ab5e8000ab0 rank 44 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n19:9034:11808 [3] NCCL INFO comm 0x2b6ba4000ab0 rank 47 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n00:14532:16701 [0] NCCL INFO comm 0x2ac0ac000ab0 rank 48 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n00:14535:16698 [2] NCCL INFO comm 0x2bb1cc000ab0 rank 50 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n11:5730:8342 [0] NCCL INFO comm 0x2b7cc4000ab0 rank 12 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n14:18192:20826 [0] NCCL INFO comm 0x2b8b18000ab0 rank 24 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n00:14536:16697 [3] NCCL INFO comm 0x2b79d4000ab0 rank 51 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n08:13434:16175 [0] NCCL INFO comm 0x2abf58000ab0 rank 80 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n08:13437:16171 [2] NCCL INFO comm 0x2b919c000ab0 rank 82 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n11:5734:8345 [3] NCCL INFO comm 0x2b4320000ab0 rank 15 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n00:14534:16703 [1] NCCL INFO comm 0x2b8e34000ab0 rank 49 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n14:18196:20819 [3] NCCL INFO comm 0x2ab848000ab0 rank 27 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n13:23993:26732 [1] NCCL INFO comm 0x2b42c0000ab0 rank 21 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n02:30404:32518 [2] NCCL INFO comm 0x2b6a10000ab0 rank 58 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n02:30405:32517 [3] NCCL INFO comm 0x2b6b88000ab0 rank 59 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n02:30403:32523 [1] NCCL INFO comm 0x2ba378000ab0 rank 57 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n10:18786:21523 [1] NCCL INFO comm 0x2ac5c0000ab0 rank 89 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n01:6279:8492 [3] NCCL INFO comm 0x2aecbc000ab0 rank 55 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n01:6278:8493 [2] NCCL INFO comm 0x2b1280000ab0 rank 54 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n18:751:3479 [0] NCCL INFO comm 0x2b8398000ab0 rank 40 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n09:8679:11332 [3] NCCL INFO comm 0x2b0eac000ab0 rank 87 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n18:755:3474 [3] NCCL INFO comm 0x2b8210000ab0 rank 43 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n18:753:3473 [1] NCCL INFO comm 0x2b3358000ab0 rank 41 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n10:875:3571 [2] NCCL INFO comm 0x2afb28000ab0 rank 10 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n10:18784:21522 [0] NCCL INFO comm 0x2af26c000ab0 rank 88 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n10:876:3570 [3] NCCL INFO comm 0x2b2f70000ab0 rank 11 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n10:874:3574 [1] NCCL INFO comm 0x2b20f0000ab0 rank 9 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n17:21282:23955 [1] NCCL INFO comm 0x2ac164000ab0 rank 37 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n02:30401:32525 [0] NCCL INFO comm 0x2badc0000ab0 rank 56 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n10:18787:21519 [2] NCCL INFO comm 0x2ae928000ab0 rank 90 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n09:27005:29650 [2] NCCL INFO comm 0x2b40ac000ab0 rank 6 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n10:18788:21518 [3] NCCL INFO comm 0x2adaac000ab0 rank 91 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n16:13446:16166 [3] NCCL INFO comm 0x2ac21c000ab0 rank 35 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n08:5136:8202 [0] NCCL INFO comm 0x2b30a8000ab0 rank 0 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n09:8678:11333 [2] NCCL INFO comm 0x2b235c000ab0 rank 86 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n08:5142:8204 [3] NCCL INFO comm 0x2ad70c000ab0 rank 3 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n08:5140:8208 [1] NCCL INFO comm 0x2b3330000ab0 rank 1 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n01:6275:8490 [0] NCCL INFO comm 0x2b899c000ab0 rank 52 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n01:6277:8491 [1] NCCL INFO comm 0x2ba5b0000ab0 rank 53 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n18:754:3475 [2] NCCL INFO comm 0x2b2c8c000ab0 rank 42 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r3n09:8675:11338 [0] NCCL INFO comm 0x2b43d0000ab0 rank 84 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n17:21284:23952 [3] NCCL INFO comm 0x2ba784000ab0 rank 39 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n10:872:3576 [0] NCCL INFO comm 0x2b62a4000ab0 rank 8 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r3n09:8677:11336 [1] NCCL INFO comm 0x2b45a8000ab0 rank 85 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n17:21280:23959 [0] NCCL INFO comm 0x2b01f0000ab0 rank 36 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n09:27006:29649 [3] NCCL INFO comm 0x2b5948000ab0 rank 7 nranks 96 cudaDev 3 busId 63000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n09:27004:29648 [1] NCCL INFO comm 0x2af944000ab0 rank 5 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n09:27002:29647 [0] NCCL INFO comm 0x2b0f80000ab0 rank 4 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n16:13445:16161 [2] NCCL INFO comm 0x2b6a48000ab0 rank 34 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n17:21283:23951 [2] NCCL INFO comm 0x2b9988000ab0 rank 38 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n16:13442:16162 [0] NCCL INFO comm 0x2b4c88000ab0 rank 32 nranks 96 cudaDev 0 busId 4000 localSize 404 used 21107856 bytes - Init COMPLETE e08r2n08:5141:8206 [2] NCCL INFO comm 0x2b5e3c000ab0 rank 2 nranks 96 cudaDev 2 busId 43000 localSize 404 used 37885072 bytes - Init COMPLETE e08r2n16:13444:16165 [1] NCCL INFO comm 0x2b03e8000ab0 rank 33 nranks 96 cudaDev 1 busId 26000 localSize 404 used 37885072 bytes - Init COMPLETE {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 3.0074, 'learning_rate': 2e-05, 'epoch': 0.01} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 2.9718, 'learning_rate': 2e-05, 'epoch': 0.02} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.101, 'learning_rate': 2e-05, 'epoch': 0.03} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 3.1011, 'learning_rate': 2e-05, 'epoch': 0.04} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 2.9208, 'learning_rate': 2e-05, 'epoch': 0.05} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0314, 'learning_rate': 2e-05, 'epoch': 0.06} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.0256, 'learning_rate': 2e-05, 'epoch': 0.07} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1189, 'learning_rate': 2e-05, 'epoch': 0.08} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1081, 'learning_rate': 2e-05, 'epoch': 0.09} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.1934, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.0965, 'learning_rate': 2e-05, 'epoch': 0.1} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.051, 'learning_rate': 2e-05, 'epoch': 0.11} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0656, 'learning_rate': 2e-05, 'epoch': 0.12} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0683, 'learning_rate': 2e-05, 'epoch': 0.13} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0148, 'learning_rate': 2e-05, 'epoch': 0.14} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0335, 'learning_rate': 2e-05, 'epoch': 0.15} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 3.0988, 'learning_rate': 2e-05, 'epoch': 0.16} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.9974, 'learning_rate': 2e-05, 'epoch': 0.17} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.8795, 'learning_rate': 2e-05, 'epoch': 0.18} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.703, 'learning_rate': 2e-05, 'epoch': 0.19} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6742, 'learning_rate': 2e-05, 'epoch': 0.2} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6332, 'learning_rate': 2e-05, 'epoch': 0.21} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.6879, 'learning_rate': 2e-05, 'epoch': 0.22} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.5488, 'learning_rate': 2e-05, 'epoch': 0.23} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.6216, 'learning_rate': 2e-05, 'epoch': 0.24} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.7379, 'learning_rate': 2e-05, 'epoch': 0.25} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.8305, 'learning_rate': 2e-05, 'epoch': 0.26} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7921, 'learning_rate': 2e-05, 'epoch': 0.27} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.7182, 'learning_rate': 2e-05, 'epoch': 0.28} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.8326, 'learning_rate': 2e-05, 'epoch': 0.29} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.7274, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.744, 'learning_rate': 2e-05, 'epoch': 0.3} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.8546, 'learning_rate': 2e-05, 'epoch': 0.31} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.7992, 'learning_rate': 2e-05, 'epoch': 0.32} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.8527, 'learning_rate': 2e-05, 'epoch': 0.33} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.953, 'learning_rate': 2e-05, 'epoch': 0.34} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.9005, 'learning_rate': 2e-05, 'epoch': 0.35} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.7138, 'learning_rate': 2e-05, 'epoch': 0.36} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.6996, 'learning_rate': 2e-05, 'epoch': 0.37} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8428, 'learning_rate': 2e-05, 'epoch': 0.38} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.8423, 'learning_rate': 2e-05, 'epoch': 0.39} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.6133, 'learning_rate': 2e-05, 'epoch': 0.4} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.7442, 'learning_rate': 2e-05, 'epoch': 0.41} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.6613, 'learning_rate': 2e-05, 'epoch': 0.42} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.7664, 'learning_rate': 2e-05, 'epoch': 0.43} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.6138, 'learning_rate': 2e-05, 'epoch': 0.44} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.517, 'learning_rate': 2e-05, 'epoch': 0.45} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6726, 'learning_rate': 2e-05, 'epoch': 0.46} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6087, 'learning_rate': 2e-05, 'epoch': 0.47} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.6648, 'learning_rate': 2e-05, 'epoch': 0.48} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.5943, 'learning_rate': 2e-05, 'epoch': 0.49} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.8677, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.9309, 'learning_rate': 2e-05, 'epoch': 0.5} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.5724, 'learning_rate': 2e-05, 'epoch': 0.51} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.8314, 'learning_rate': 2e-05, 'epoch': 0.52} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.6957, 'learning_rate': 2e-05, 'epoch': 0.53} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.4999, 'learning_rate': 2e-05, 'epoch': 0.54} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.6508, 'learning_rate': 2e-05, 'epoch': 0.55} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.4469, 'learning_rate': 2e-05, 'epoch': 0.56} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.768, 'learning_rate': 2e-05, 'epoch': 0.57} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6756, 'learning_rate': 2e-05, 'epoch': 0.58} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.6645, 'learning_rate': 2e-05, 'epoch': 0.59} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.7557, 'learning_rate': 2e-05, 'epoch': 0.6} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.5535, 'learning_rate': 2e-05, 'epoch': 0.61} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.6781, 'learning_rate': 2e-05, 'epoch': 0.62} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.5942, 'learning_rate': 2e-05, 'epoch': 0.63} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.6047, 'learning_rate': 2e-05, 'epoch': 0.64} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.7512, 'learning_rate': 2e-05, 'epoch': 0.65} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.5335, 'learning_rate': 2e-05, 'epoch': 0.66} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.766, 'learning_rate': 2e-05, 'epoch': 0.67} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.664, 'learning_rate': 2e-05, 'epoch': 0.68} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.6321, 'learning_rate': 2e-05, 'epoch': 0.69} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.8106, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6122, 'learning_rate': 2e-05, 'epoch': 0.7} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.6623, 'learning_rate': 2e-05, 'epoch': 0.71} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7701, 'learning_rate': 2e-05, 'epoch': 0.72} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7783, 'learning_rate': 2e-05, 'epoch': 0.73} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.7757, 'learning_rate': 2e-05, 'epoch': 0.74} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.6474, 'learning_rate': 2e-05, 'epoch': 0.75} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.7175, 'learning_rate': 2e-05, 'epoch': 0.76} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.4948, 'learning_rate': 2e-05, 'epoch': 0.77} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.7146, 'learning_rate': 2e-05, 'epoch': 0.78} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6198, 'learning_rate': 2e-05, 'epoch': 0.79} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.6583, 'learning_rate': 2e-05, 'epoch': 0.8} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.7755, 'learning_rate': 2e-05, 'epoch': 0.81} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.6385, 'learning_rate': 2e-05, 'epoch': 0.82} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.5971, 'learning_rate': 2e-05, 'epoch': 0.83} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.6127, 'learning_rate': 2e-05, 'epoch': 0.84} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.5975, 'learning_rate': 2e-05, 'epoch': 0.85} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.6233, 'learning_rate': 2e-05, 'epoch': 0.86} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.5939, 'learning_rate': 2e-05, 'epoch': 0.87} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.6647, 'learning_rate': 2e-05, 'epoch': 0.88} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7393, 'learning_rate': 2e-05, 'epoch': 0.89} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7192, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.6178, 'learning_rate': 2e-05, 'epoch': 0.9} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.7352, 'learning_rate': 2e-05, 'epoch': 0.91} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.4345, 'learning_rate': 2e-05, 'epoch': 0.92} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5915, 'learning_rate': 2e-05, 'epoch': 0.93} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.5623, 'learning_rate': 2e-05, 'epoch': 0.94} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.4568, 'learning_rate': 2e-05, 'epoch': 0.95} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5584, 'learning_rate': 2e-05, 'epoch': 0.96} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5673, 'learning_rate': 2e-05, 'epoch': 0.97} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.5086, 'learning_rate': 2e-05, 'epoch': 0.98} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.56, 'learning_rate': 2e-05, 'epoch': 0.99} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.5144, 'learning_rate': 2e-05, 'epoch': 1.0} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.196, 'learning_rate': 2e-05, 'epoch': 1.01} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 2.0514, 'learning_rate': 2e-05, 'epoch': 1.02} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9928, 'learning_rate': 2e-05, 'epoch': 1.03} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 1.9547, 'learning_rate': 2e-05, 'epoch': 1.04} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0976, 'learning_rate': 2e-05, 'epoch': 1.05} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 2.0057, 'learning_rate': 2e-05, 'epoch': 1.06} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.8813, 'learning_rate': 2e-05, 'epoch': 1.07} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.08} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 2.0039, 'learning_rate': 2e-05, 'epoch': 1.09} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9782, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9524, 'learning_rate': 2e-05, 'epoch': 1.1} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 1.9815, 'learning_rate': 2e-05, 'epoch': 1.11} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.0192, 'learning_rate': 2e-05, 'epoch': 1.12} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.2164, 'learning_rate': 2e-05, 'epoch': 1.13} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 2.0539, 'learning_rate': 2e-05, 'epoch': 1.14} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.9541, 'learning_rate': 2e-05, 'epoch': 1.15} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.907, 'learning_rate': 2e-05, 'epoch': 1.16} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9438, 'learning_rate': 2e-05, 'epoch': 1.17} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.9396, 'learning_rate': 2e-05, 'epoch': 1.18} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8725, 'learning_rate': 2e-05, 'epoch': 1.19} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 1.8599, 'learning_rate': 2e-05, 'epoch': 1.2} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.1224, 'learning_rate': 2e-05, 'epoch': 1.21} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 2.0364, 'learning_rate': 2e-05, 'epoch': 1.22} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.9687, 'learning_rate': 2e-05, 'epoch': 1.23} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 1.8761, 'learning_rate': 2e-05, 'epoch': 1.24} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 2.1039, 'learning_rate': 2e-05, 'epoch': 1.25} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.9864, 'learning_rate': 2e-05, 'epoch': 1.26} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 1.994, 'learning_rate': 2e-05, 'epoch': 1.27} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 2.0454, 'learning_rate': 2e-05, 'epoch': 1.28} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 1.9142, 'learning_rate': 2e-05, 'epoch': 1.29} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 1.8799, 'learning_rate': 2e-05, 'epoch': 1.3} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 2.0278, 'learning_rate': 2e-05, 'epoch': 1.31} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.8938, 'learning_rate': 2e-05, 'epoch': 1.32} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 1.9261, 'learning_rate': 2e-05, 'epoch': 1.33} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.018, 'learning_rate': 2e-05, 'epoch': 1.34} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0798, 'learning_rate': 2e-05, 'epoch': 1.35} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 2.0217, 'learning_rate': 2e-05, 'epoch': 1.36} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 1.9532, 'learning_rate': 2e-05, 'epoch': 1.37} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 2.1048, 'learning_rate': 2e-05, 'epoch': 1.38} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.8571, 'learning_rate': 2e-05, 'epoch': 1.39} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 1.9703, 'learning_rate': 2e-05, 'epoch': 1.4} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.1253, 'learning_rate': 2e-05, 'epoch': 1.41} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 2.063, 'learning_rate': 2e-05, 'epoch': 1.42} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9485, 'learning_rate': 2e-05, 'epoch': 1.43} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.9684, 'learning_rate': 2e-05, 'epoch': 1.44} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 1.967, 'learning_rate': 2e-05, 'epoch': 1.45} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0325, 'learning_rate': 2e-05, 'epoch': 1.46} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 2.0336, 'learning_rate': 2e-05, 'epoch': 1.47} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 1.9162, 'learning_rate': 2e-05, 'epoch': 1.48} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.0501, 'learning_rate': 2e-05, 'epoch': 1.49} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 2.1049, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.5} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 1.9727, 'learning_rate': 2e-05, 'epoch': 1.51} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 2.1257, 'learning_rate': 2e-05, 'epoch': 1.52} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9947, 'learning_rate': 2e-05, 'epoch': 1.53} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9176, 'learning_rate': 2e-05, 'epoch': 1.54} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 1.9117, 'learning_rate': 2e-05, 'epoch': 1.55} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0693, 'learning_rate': 2e-05, 'epoch': 1.56} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.0548, 'learning_rate': 2e-05, 'epoch': 1.57} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 2.106, 'learning_rate': 2e-05, 'epoch': 1.58} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 1.9293, 'learning_rate': 2e-05, 'epoch': 1.59} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.1129, 'learning_rate': 2e-05, 'epoch': 1.6} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0234, 'learning_rate': 2e-05, 'epoch': 1.61} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0279, 'learning_rate': 2e-05, 'epoch': 1.62} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.0498, 'learning_rate': 2e-05, 'epoch': 1.63} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 2.15, 'learning_rate': 2e-05, 'epoch': 1.64} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.9251, 'learning_rate': 2e-05, 'epoch': 1.65} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 1.8976, 'learning_rate': 2e-05, 'epoch': 1.66} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0163, 'learning_rate': 2e-05, 'epoch': 1.67} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 2.0119, 'learning_rate': 2e-05, 'epoch': 1.68} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 1.854, 'learning_rate': 2e-05, 'epoch': 1.69} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0104, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.1058, 'learning_rate': 2e-05, 'epoch': 1.7} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0002, 'learning_rate': 2e-05, 'epoch': 1.71} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 2.0537, 'learning_rate': 2e-05, 'epoch': 1.72} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9804, 'learning_rate': 2e-05, 'epoch': 1.73} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 1.9399, 'learning_rate': 2e-05, 'epoch': 1.74} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 2.0516, 'learning_rate': 2e-05, 'epoch': 1.75} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.9135, 'learning_rate': 2e-05, 'epoch': 1.76} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 1.988, 'learning_rate': 2e-05, 'epoch': 1.77} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 2.0287, 'learning_rate': 2e-05, 'epoch': 1.78} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 1.8886, 'learning_rate': 2e-05, 'epoch': 1.79} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 2.0572, 'learning_rate': 2e-05, 'epoch': 1.8} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 1.9742, 'learning_rate': 2e-05, 'epoch': 1.81} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0112, 'learning_rate': 2e-05, 'epoch': 1.82} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 2.0405, 'learning_rate': 2e-05, 'epoch': 1.83} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9959, 'learning_rate': 2e-05, 'epoch': 1.84} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9963, 'learning_rate': 2e-05, 'epoch': 1.85} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 1.9995, 'learning_rate': 2e-05, 'epoch': 1.86} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 2.0961, 'learning_rate': 2e-05, 'epoch': 1.87} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 1.9971, 'learning_rate': 2e-05, 'epoch': 1.88} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0856, 'learning_rate': 2e-05, 'epoch': 1.89} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0359, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0212, 'learning_rate': 2e-05, 'epoch': 1.9} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0885, 'learning_rate': 2e-05, 'epoch': 1.91} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0576, 'learning_rate': 2e-05, 'epoch': 1.92} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 2.0034, 'learning_rate': 2e-05, 'epoch': 1.93} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 1.8261, 'learning_rate': 2e-05, 'epoch': 1.94} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.002, 'learning_rate': 2e-05, 'epoch': 1.95} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.0309, 'learning_rate': 2e-05, 'epoch': 1.96} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.014, 'learning_rate': 2e-05, 'epoch': 1.97} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 2.1139, 'learning_rate': 2e-05, 'epoch': 1.98} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.9854, 'learning_rate': 2e-05, 'epoch': 1.99} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.7357, 'learning_rate': 2e-05, 'epoch': 2.0} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.4515, 'learning_rate': 2e-05, 'epoch': 2.01} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2709, 'learning_rate': 2e-05, 'epoch': 2.02} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2579, 'learning_rate': 2e-05, 'epoch': 2.03} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.2997, 'learning_rate': 2e-05, 'epoch': 2.04} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.3373, 'learning_rate': 2e-05, 'epoch': 2.05} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.377, 'learning_rate': 2e-05, 'epoch': 2.06} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2084, 'learning_rate': 2e-05, 'epoch': 2.07} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2738, 'learning_rate': 2e-05, 'epoch': 2.08} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.2616, 'learning_rate': 2e-05, 'epoch': 2.09} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3439, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.2739, 'learning_rate': 2e-05, 'epoch': 2.1} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.3546, 'learning_rate': 2e-05, 'epoch': 2.11} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.2944, 'learning_rate': 2e-05, 'epoch': 2.12} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.3537, 'learning_rate': 2e-05, 'epoch': 2.13} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.2957, 'learning_rate': 2e-05, 'epoch': 2.14} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3213, 'learning_rate': 2e-05, 'epoch': 2.15} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.3394, 'learning_rate': 2e-05, 'epoch': 2.16} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.2459, 'learning_rate': 2e-05, 'epoch': 2.17} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3403, 'learning_rate': 2e-05, 'epoch': 2.18} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3336, 'learning_rate': 2e-05, 'epoch': 2.19} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.2} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3205, 'learning_rate': 2e-05, 'epoch': 2.21} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3413, 'learning_rate': 2e-05, 'epoch': 2.22} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.3254, 'learning_rate': 2e-05, 'epoch': 2.23} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.2684, 'learning_rate': 2e-05, 'epoch': 2.24} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.3131, 'learning_rate': 2e-05, 'epoch': 2.25} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.2199, 'learning_rate': 2e-05, 'epoch': 2.26} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.3389, 'learning_rate': 2e-05, 'epoch': 2.27} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.2217, 'learning_rate': 2e-05, 'epoch': 2.28} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.3375, 'learning_rate': 2e-05, 'epoch': 2.29} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2168, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.3267, 'learning_rate': 2e-05, 'epoch': 2.3} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.31} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.2711, 'learning_rate': 2e-05, 'epoch': 2.32} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.3214, 'learning_rate': 2e-05, 'epoch': 2.33} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.233, 'learning_rate': 2e-05, 'epoch': 2.34} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2523, 'learning_rate': 2e-05, 'epoch': 2.35} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.2286, 'learning_rate': 2e-05, 'epoch': 2.36} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3709, 'learning_rate': 2e-05, 'epoch': 2.37} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.3404, 'learning_rate': 2e-05, 'epoch': 2.38} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.2885, 'learning_rate': 2e-05, 'epoch': 2.39} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3858, 'learning_rate': 2e-05, 'epoch': 2.4} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3512, 'learning_rate': 2e-05, 'epoch': 2.41} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3298, 'learning_rate': 2e-05, 'epoch': 2.42} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3342, 'learning_rate': 2e-05, 'epoch': 2.43} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3715, 'learning_rate': 2e-05, 'epoch': 2.44} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.3386, 'learning_rate': 2e-05, 'epoch': 2.45} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2864, 'learning_rate': 2e-05, 'epoch': 2.46} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.2937, 'learning_rate': 2e-05, 'epoch': 2.47} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.1762, 'learning_rate': 2e-05, 'epoch': 2.48} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.2814, 'learning_rate': 2e-05, 'epoch': 2.49} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.3049, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.4325, 'learning_rate': 2e-05, 'epoch': 2.5} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2729, 'learning_rate': 2e-05, 'epoch': 2.51} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2322, 'learning_rate': 2e-05, 'epoch': 2.52} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.2866, 'learning_rate': 2e-05, 'epoch': 2.53} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.3139, 'learning_rate': 2e-05, 'epoch': 2.54} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.55} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.2646, 'learning_rate': 2e-05, 'epoch': 2.56} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.4647, 'learning_rate': 2e-05, 'epoch': 2.57} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3428, 'learning_rate': 2e-05, 'epoch': 2.58} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.3536, 'learning_rate': 2e-05, 'epoch': 2.59} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.6} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.3249, 'learning_rate': 2e-05, 'epoch': 2.61} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.2609, 'learning_rate': 2e-05, 'epoch': 2.62} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.3228, 'learning_rate': 2e-05, 'epoch': 2.63} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.2768, 'learning_rate': 2e-05, 'epoch': 2.64} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3281, 'learning_rate': 2e-05, 'epoch': 2.65} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3497, 'learning_rate': 2e-05, 'epoch': 2.66} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3671, 'learning_rate': 2e-05, 'epoch': 2.67} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.3748, 'learning_rate': 2e-05, 'epoch': 2.68} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.318, 'learning_rate': 2e-05, 'epoch': 2.69} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2901, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.2674, 'learning_rate': 2e-05, 'epoch': 2.7} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.3522, 'learning_rate': 2e-05, 'epoch': 2.71} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.372, 'learning_rate': 2e-05, 'epoch': 2.72} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.2824, 'learning_rate': 2e-05, 'epoch': 2.73} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.3092, 'learning_rate': 2e-05, 'epoch': 2.74} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.339, 'learning_rate': 2e-05, 'epoch': 2.75} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.2787, 'learning_rate': 2e-05, 'epoch': 2.76} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3493, 'learning_rate': 2e-05, 'epoch': 2.77} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3189, 'learning_rate': 2e-05, 'epoch': 2.78} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3947, 'learning_rate': 2e-05, 'epoch': 2.79} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.3981, 'learning_rate': 2e-05, 'epoch': 2.8} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2571, 'learning_rate': 2e-05, 'epoch': 2.81} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.2829, 'learning_rate': 2e-05, 'epoch': 2.82} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3774, 'learning_rate': 2e-05, 'epoch': 2.83} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3975, 'learning_rate': 2e-05, 'epoch': 2.84} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.3457, 'learning_rate': 2e-05, 'epoch': 2.85} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.398, 'learning_rate': 2e-05, 'epoch': 2.86} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3567, 'learning_rate': 2e-05, 'epoch': 2.87} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.3209, 'learning_rate': 2e-05, 'epoch': 2.88} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.436, 'learning_rate': 2e-05, 'epoch': 2.89} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.2995, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.36, 'learning_rate': 2e-05, 'epoch': 2.9} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3351, 'learning_rate': 2e-05, 'epoch': 2.91} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3399, 'learning_rate': 2e-05, 'epoch': 2.92} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.3669, 'learning_rate': 2e-05, 'epoch': 2.93} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.2785, 'learning_rate': 2e-05, 'epoch': 2.94} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3644, 'learning_rate': 2e-05, 'epoch': 2.95} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3627, 'learning_rate': 2e-05, 'epoch': 2.96} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3398, 'learning_rate': 2e-05, 'epoch': 2.97} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3788, 'learning_rate': 2e-05, 'epoch': 2.98} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.3488, 'learning_rate': 2e-05, 'epoch': 2.99} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 1.113, 'learning_rate': 2e-05, 'epoch': 3.0} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.8322, 'learning_rate': 2e-05, 'epoch': 3.01} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.844, 'learning_rate': 2e-05, 'epoch': 3.02} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.7831, 'learning_rate': 2e-05, 'epoch': 3.03} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.04} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.755, 'learning_rate': 2e-05, 'epoch': 3.05} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7481, 'learning_rate': 2e-05, 'epoch': 3.06} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.7076, 'learning_rate': 2e-05, 'epoch': 3.07} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.8271, 'learning_rate': 2e-05, 'epoch': 3.08} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.7923, 'learning_rate': 2e-05, 'epoch': 3.09} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8009, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.7911, 'learning_rate': 2e-05, 'epoch': 3.1} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.8084, 'learning_rate': 2e-05, 'epoch': 3.11} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.6808, 'learning_rate': 2e-05, 'epoch': 3.12} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.8076, 'learning_rate': 2e-05, 'epoch': 3.13} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7355, 'learning_rate': 2e-05, 'epoch': 3.14} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7254, 'learning_rate': 2e-05, 'epoch': 3.15} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7739, 'learning_rate': 2e-05, 'epoch': 3.16} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7981, 'learning_rate': 2e-05, 'epoch': 3.17} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7642, 'learning_rate': 2e-05, 'epoch': 3.18} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.19} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.2} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7646, 'learning_rate': 2e-05, 'epoch': 3.21} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7001, 'learning_rate': 2e-05, 'epoch': 3.22} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.7356, 'learning_rate': 2e-05, 'epoch': 3.23} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8122, 'learning_rate': 2e-05, 'epoch': 3.24} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.8434, 'learning_rate': 2e-05, 'epoch': 3.25} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7732, 'learning_rate': 2e-05, 'epoch': 3.26} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.7806, 'learning_rate': 2e-05, 'epoch': 3.27} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.8449, 'learning_rate': 2e-05, 'epoch': 3.28} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7957, 'learning_rate': 2e-05, 'epoch': 3.29} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.7905, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8118, 'learning_rate': 2e-05, 'epoch': 3.3} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.8295, 'learning_rate': 2e-05, 'epoch': 3.31} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.7947, 'learning_rate': 2e-05, 'epoch': 3.32} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.8046, 'learning_rate': 2e-05, 'epoch': 3.33} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7046, 'learning_rate': 2e-05, 'epoch': 3.34} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7492, 'learning_rate': 2e-05, 'epoch': 3.35} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7847, 'learning_rate': 2e-05, 'epoch': 3.36} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7721, 'learning_rate': 2e-05, 'epoch': 3.37} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7348, 'learning_rate': 2e-05, 'epoch': 3.38} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.7685, 'learning_rate': 2e-05, 'epoch': 3.39} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.8034, 'learning_rate': 2e-05, 'epoch': 3.4} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7863, 'learning_rate': 2e-05, 'epoch': 3.41} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7507, 'learning_rate': 2e-05, 'epoch': 3.42} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.7681, 'learning_rate': 2e-05, 'epoch': 3.43} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.6975, 'learning_rate': 2e-05, 'epoch': 3.44} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.7536, 'learning_rate': 2e-05, 'epoch': 3.45} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.8365, 'learning_rate': 2e-05, 'epoch': 3.46} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.809, 'learning_rate': 2e-05, 'epoch': 3.47} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8415, 'learning_rate': 2e-05, 'epoch': 3.48} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8058, 'learning_rate': 2e-05, 'epoch': 3.49} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.8516, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7523, 'learning_rate': 2e-05, 'epoch': 3.5} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.7196, 'learning_rate': 2e-05, 'epoch': 3.51} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.8059, 'learning_rate': 2e-05, 'epoch': 3.52} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7867, 'learning_rate': 2e-05, 'epoch': 3.53} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7444, 'learning_rate': 2e-05, 'epoch': 3.54} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.7696, 'learning_rate': 2e-05, 'epoch': 3.55} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.8079, 'learning_rate': 2e-05, 'epoch': 3.56} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.7156, 'learning_rate': 2e-05, 'epoch': 3.57} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.811, 'learning_rate': 2e-05, 'epoch': 3.58} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.783, 'learning_rate': 2e-05, 'epoch': 3.59} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8232, 'learning_rate': 2e-05, 'epoch': 3.6} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8344, 'learning_rate': 2e-05, 'epoch': 3.61} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.8573, 'learning_rate': 2e-05, 'epoch': 3.62} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7692, 'learning_rate': 2e-05, 'epoch': 3.63} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.7515, 'learning_rate': 2e-05, 'epoch': 3.64} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8301, 'learning_rate': 2e-05, 'epoch': 3.65} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8599, 'learning_rate': 2e-05, 'epoch': 3.66} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8069, 'learning_rate': 2e-05, 'epoch': 3.67} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.8997, 'learning_rate': 2e-05, 'epoch': 3.68} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.747, 'learning_rate': 2e-05, 'epoch': 3.69} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.8352, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7704, 'learning_rate': 2e-05, 'epoch': 3.7} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7737, 'learning_rate': 2e-05, 'epoch': 3.71} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7325, 'learning_rate': 2e-05, 'epoch': 3.72} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.7538, 'learning_rate': 2e-05, 'epoch': 3.73} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.8204, 'learning_rate': 2e-05, 'epoch': 3.74} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.7833, 'learning_rate': 2e-05, 'epoch': 3.75} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.922, 'learning_rate': 2e-05, 'epoch': 3.76} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8706, 'learning_rate': 2e-05, 'epoch': 3.77} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8191, 'learning_rate': 2e-05, 'epoch': 3.78} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.8133, 'learning_rate': 2e-05, 'epoch': 3.79} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.7762, 'learning_rate': 2e-05, 'epoch': 3.8} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8299, 'learning_rate': 2e-05, 'epoch': 3.81} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.8402, 'learning_rate': 2e-05, 'epoch': 3.82} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7884, 'learning_rate': 2e-05, 'epoch': 3.83} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7686, 'learning_rate': 2e-05, 'epoch': 3.84} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.7748, 'learning_rate': 2e-05, 'epoch': 3.85} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8029, 'learning_rate': 2e-05, 'epoch': 3.86} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.8096, 'learning_rate': 2e-05, 'epoch': 3.87} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7443, 'learning_rate': 2e-05, 'epoch': 3.88} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.7848, 'learning_rate': 2e-05, 'epoch': 3.89} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.737, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.8875, 'learning_rate': 2e-05, 'epoch': 3.9} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.7877, 'learning_rate': 2e-05, 'epoch': 3.91} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.846, 'learning_rate': 2e-05, 'epoch': 3.92} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8083, 'learning_rate': 2e-05, 'epoch': 3.93} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.8566, 'learning_rate': 2e-05, 'epoch': 3.94} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.7885, 'learning_rate': 2e-05, 'epoch': 3.95} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8519, 'learning_rate': 2e-05, 'epoch': 3.96} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8396, 'learning_rate': 2e-05, 'epoch': 3.97} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8253, 'learning_rate': 2e-05, 'epoch': 3.98} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.8756, 'learning_rate': 2e-05, 'epoch': 3.99} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'loss': 0.5905, 'learning_rate': 2e-05, 'epoch': 4.0} {'train_runtime': 24950.7967, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.8037, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.6945, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7972, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7784, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7825, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7796, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7761, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7783, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7805, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.8068, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7974, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.791, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.8117, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7412, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7957, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7719, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7982, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7787, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.801, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7957, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.787, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.7777, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0} {'train_runtime': 24950.8044, 'train_samples_per_second': 1.603, 'train_steps_per_second': 0.017, 'train_loss': 1.7131820563759124, 'epoch': 4.0}