0: WARNING 26-04-29 01:17:31.917061 - 0:00:00 - Signal handler installed. 0: WARNING 26-04-29 01:17:31.917445 - 0:00:00 - WARNING: Setting MKL_SERVICE_FORCE_INTEL to GNU 0: WARNING 26-04-29 01:17:31.917532 - 0:00:00 - WARNING: Setting MKL_NUM_THREADS to 1 0: WARNING 26-04-29 01:17:31.917596 - 0:00:00 - WARNING: Setting ENABLE_INTRA_NODE_COMM to 1 0: WARNING 26-04-29 01:17:31.917647 - 0:00:00 - WARNING: Setting TORCH_NCCL_AVOID_RECORD_STREAMS to 1 0: WARNING 26-04-29 01:17:31.917696 - 0:00:00 - WARNING: Setting NCCL_IB_TIMEOUT to 22 0: WARNING 26-04-29 01:17:31.917741 - 0:00:00 - WARNING: Setting NCCL_DEBUG to INFO 0: WARNING 26-04-29 01:17:31.917785 - 0:00:00 - WARNING: Setting TRITON_CACHE_DIR to /scratch/local/xun/tmp/tmph8ew25jc 0: INFO 26-04-29 01:17:41.821640 - 0:00:10 - Run launched with torchrun, local rank: 0 0: INFO 26-04-29 01:17:41.822359 - 0:00:10 - ENV: environ({'SHELL': '/bin/bash', '__EGL_VENDOR_LIBRARY_DIRS': '/home/xun/anaconda3/share/glvnd/egl_vendor.d', 'COLORTERM': 'truecolor', 'SLURM_STEP_NUM_TASKS': '4', 'PYENV_SHELL': 'bash', 'SLURM_JOB_USER': 'xun', 'SLURM_TASKS_PER_NODE': '1(x4)', 'PYTHONUNBUFFERED': '1', 'SLURM_JOB_UID': '1005', 'OLD_PATH': '/usr/local/cuda/bin:/opt/slurm/bin:/home/xun/.local/bin:/opt/pyenv/shims:/opt/pyenv/bin:/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/bin/remote-cli:/home/xun/.local/bin:/home/xun/.nvm/versions/node/v22.22.2/bin:/home/xun/anaconda3/bin:/home/xun/anaconda3/condabin:/home/xun/.local/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/opt/pyenv/bin:/home/xun/.local/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin', 'SLURM_STEP_GPUS': '0,1,2,3,4,5,6,7', 'NVM_INC': '/home/xun/.nvm/versions/node/v22.22.2/include/node', 'TERM_PROGRAM_VERSION': '3.1.15', 'SLURM_CPU_BIND': 'quiet,mask_cpu:0x000000FFFFFFFFFFFFFFFF000000FFFFFFFFFFFFFFFF', 'HPCX_HCOLL_DIR': '/opt/hpcx/hcoll', 'SLURM_TASK_PID': '1059988', 'CONDA_EXE': '/home/xun/anaconda3/bin/conda', '_CE_M': '', 'PKG_CONFIG_PATH': '/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:', 'SLURM_JOB_GPUS': '0,1,2,3,4,5,6,7', 'SLURM_LOCALID': '0', 'PYTHONNOUSERSITE': '1', 'SLURM_SUBMIT_DIR': '/home/xun/rsadhukh/STEM', 'SLURM_CPU_BIND_VERBOSE': 'quiet', 'HOSTNAME': 'compute-node-14', 'HPCX_CLUSTERKIT_DIR': '/opt/hpcx/clusterkit', 'SLURMD_NODENAME': 'compute-node-14', 'MASTER_PORT': '29500', 'SLURM_JOB_START_TIME': '1777425423', 'TORCH_NCCL_TIMEOUT': '1200', 'HYDRA_LAUNCHER_EXTRA_ARGS': '--external-launcher', 'OMPI_HOME': '/opt/hpcx/ompi', 'HPCX_OSU_CUDA_DIR': '/opt/hpcx/ompi/tests/osu-micro-benchmarks-cuda', 'SLURM_STEP_NODELIST': 'compute-node-[14,0,43-44]', 'TRAINING_LOG_DIR': '/home/xun/rsadhukh/STEM/logs/midfine_base_final', 'WANDB_DIR': '/home/xun/rsadhukh/STEM/logs/midfine_base_final', 'SLURM_CLUSTER_NAME': 'cluster', 'SLURM_JOB_END_TIME': '1777598223', 'SLURM_CPUS_ON_NODE': '128', 'SLURM_UMASK': '0000', 'HPCX_OSU_DIR': '/opt/hpcx/ompi/tests/osu-micro-benchmarks', 'SLURM_JOB_CPUS_PER_NODE': '128(x4)', 'HPCX_MPI_DIR': '/opt/hpcx/ompi', 'HPCX_OSHMEM_DIR': '/opt/hpcx/ompi', 'SLURM_GPUS_ON_NODE': '8', 'PWD': '/home/xun/rsadhukh/STEM', 'HPCX_UCC_DIR': '/opt/hpcx/ucc', 'PRTE_MCA_plm_slurm_args': '--external-launcher', 'SLURM_GTIDS': '0', 'GSETTINGS_SCHEMA_DIR': '/home/xun/anaconda3/share/glib-2.0/schemas', 'LOGNAME': 'xun', 'XDG_SESSION_TYPE': 'tty', 'CONDA_PREFIX': '/home/xun/anaconda3', 'SLURM_JOB_PARTITION': 'high', 'MODULESHOME': '/usr/share/modules', 'MANPATH': '/home/xun/.nvm/versions/node/v22.22.2/share/man::', 'SLURM_TRES_PER_TASK': 'cpu:128', 'GK_GL_PATH': '/tmp/gitkraken/gitlens/gitlens-ipc-server-4040699-45715.json', 'GSETTINGS_SCHEMA_DIR_CONDA_BACKUP': '', 'SLURM_JOB_NUM_NODES': '4', 'GK_GL_ADDR': 'http://127.0.0.1:45715', 'SRUN_DEBUG': '3', 'SLURM_STEPID': '0', 'SLURM_CPU_BIND_LIST': '0x000000FFFFFFFFFFFFFFFF000000FFFFFFFFFFFFFFFF', 'VSCODE_GIT_ASKPASS_NODE': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/node', 'SLURM_JOBID': '29496', 'GLOO_SOCKET_IFNAME': 'ens7', 'WORLD_SIZE': '32', 'SLURM_LAUNCH_NODE_IPADDR': '172.27.49.7', 'I_MPI_HYDRA_BOOTSTRAP_EXEC_EXTRA_ARGS': '--external-launcher', 'OLD_PKG_CONFIG_PATH': '/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:', 'MPI_HOME': '/opt/hpcx/ompi', 'MOTD_SHOWN': 'pam', 'TORCH_LOGS': 'recompiles,graph_breaks,dynamo,inductor', 'HOME': '/home/xun', 'LANG': 'C.UTF-8', 'SLURM_CPU_BIND_TYPE': 'mask_cpu:', 'LS_COLORS': 'rs=0:di=01;34:ln=01;36:mh=00:pi=40;33:so=01;35:do=01;35:bd=40;33;01:cd=40;33;01:or=40;31;01:mi=00:su=37;41:sg=30;43:ca=30;41:tw=30;42:ow=34;42:st=37;44:ex=01;32:*.tar=01;31:*.tgz=01;31:*.arc=01;31:*.arj=01;31:*.taz=01;31:*.lha=01;31:*.lz4=01;31:*.lzh=01;31:*.lzma=01;31:*.tlz=01;31:*.txz=01;31:*.tzo=01;31:*.t7z=01;31:*.zip=01;31:*.z=01;31:*.dz=01;31:*.gz=01;31:*.lrz=01;31:*.lz=01;31:*.lzo=01;31:*.xz=01;31:*.zst=01;31:*.tzst=01;31:*.bz2=01;31:*.bz=01;31:*.tbz=01;31:*.tbz2=01;31:*.tz=01;31:*.deb=01;31:*.rpm=01;31:*.jar=01;31:*.war=01;31:*.ear=01;31:*.sar=01;31:*.rar=01;31:*.alz=01;31:*.ace=01;31:*.zoo=01;31:*.cpio=01;31:*.7z=01;31:*.rz=01;31:*.cab=01;31:*.wim=01;31:*.swm=01;31:*.dwm=01;31:*.esd=01;31:*.jpg=01;35:*.jpeg=01;35:*.mjpg=01;35:*.mjpeg=01;35:*.gif=01;35:*.bmp=01;35:*.pbm=01;35:*.pgm=01;35:*.ppm=01;35:*.tga=01;35:*.xbm=01;35:*.xpm=01;35:*.tif=01;35:*.tiff=01;35:*.png=01;35:*.svg=01;35:*.svgz=01;35:*.mng=01;35:*.pcx=01;35:*.mov=01;35:*.mpg=01;35:*.mpeg=01;35:*.m2v=01;35:*.mkv=01;35:*.webm=01;35:*.webp=01;35:*.ogm=01;35:*.mp4=01;35:*.m4v=01;35:*.mp4v=01;35:*.vob=01;35:*.qt=01;35:*.nuv=01;35:*.wmv=01;35:*.asf=01;35:*.rm=01;35:*.rmvb=01;35:*.flc=01;35:*.avi=01;35:*.fli=01;35:*.flv=01;35:*.gl=01;35:*.dl=01;35:*.xcf=01;35:*.xwd=01;35:*.yuv=01;35:*.cgm=01;35:*.emf=01;35:*.ogv=01;35:*.ogx=01;35:*.aac=00;36:*.au=00;36:*.flac=00;36:*.m4a=00;36:*.mid=00;36:*.midi=00;36:*.mka=00;36:*.mp3=00;36:*.mpc=00;36:*.ogg=00;36:*.ra=00;36:*.wav=00;36:*.oga=00;36:*.opus=00;36:*.spx=00;36:*.xspf=00;36:', 'OSHMEM_HOME': '/opt/hpcx/ompi', 'SLURMD_DEBUG': '2', 'SLURM_PROCID': '0', 'OLD_LIBRARY_PATH': '/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:', 'VIRTUAL_ENV': '/home/xun/rsadhukh/STEM/stem', 'SSL_CERT_DIR': '/usr/lib/ssl/certs', 'HPCX_UCX_DIR': '/opt/hpcx/ucx', 'CONDA_PROMPT_MODIFIER': '(base) ', 'TMPDIR': '/scratch/local/xun/tmp', 'GIT_ASKPASS': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/extensions/git/dist/askpass.sh', 'VSCODE_GIT_IPC_AUTH_TOKEN': '7ad9d34ebdd8f3e4e953f48f0f39d194dc1fec5170a626734328d81e9c14d270', 'SLURM_CPUS_PER_TASK': '128', 'SLURM_NTASKS': '4', 'CONFIG_PATH': 'apps/main/configs/olmo2_1B_midfine.yaml', 'SLURM_TOPOLOGY_ADDR': 'compute-node-14', 'SSH_CONNECTION': '67.163.187.8 57991 172.27.51.97 22', 'OLD_CPATH': '/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:', 'SLURM_DISTRIBUTION': 'cyclic', 'ROOT_MODEL_DIR': '/data/rsadhukh/checkpoints', 'PYTORCH_CUDA_ALLOC_CONF': 'expandable_segments:True', 'HYDRA_BOOTSTRAP': 'slurm', 'SHMEM_HOME': '/opt/hpcx/ompi', 'NVM_DIR': '/home/xun/.nvm', 'MASTER_ADDR': 'compute-node-14', 'VSCODE_GIT_ASKPASS_EXTRA_ARGS': '', 'CUDA_VISIBLE_DEVICES': '0,1,2,3,4,5,6,7', 'SLURM_TOPOLOGY_ADDR_PATTERN': 'node', 'SLURM_SRUN_COMM_HOST': '172.27.49.7', '_CONDA_EXE': '/home/xun/anaconda3/bin/conda', 'LESSCLOSE': '/usr/bin/lesspipe %s %s', '_CONDA_ROOT': '/home/xun/anaconda3', 'XDG_SESSION_CLASS': 'user', 'PYTHONPATH': '/home/xun/rsadhukh/STEM:', 'TERM': 'xterm-256color', '_CE_CONDA': '', 'LESSOPEN': '| /usr/bin/lesspipe %s', 'USER': 'xun', 'LIBRARY_PATH': '/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:', 'HPCX_SHARP_DIR': '/opt/hpcx/sharp', 'SLURM_NODELIST': 'compute-node-[14,0,43-44]', 'WANDB_API_KEY': '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', 'VSCODE_GIT_IPC_HANDLE': '/run/user/1005/vscode-git-c563716340.sock', 'ENVIRONMENT': 'BATCH', 'CONDA_SHLVL': '1', 'SLURM_SRUN_COMM_PORT': '44949', 'NODES': '4', 'EXP_NAME': 'midfine_base_final', 'LOADEDMODULES': '', 'TEMP': '/scratch/local/xun/tmp', 'SLURM_STEP_ID': '0', 'SLURM_PRIO_PROCESS': '0', 'SLURM_NPROCS': '4', 'SHLVL': '3', 'NVM_CD_FLAGS': '', 'SLURM_NNODES': '4', 'WANDB_MODE': 'online', 'HPCX_DIR': '/opt/hpcx', 'XDG_SESSION_ID': '1065', 'VIRTUAL_ENV_PROMPT': '(stem) ', 'TORCHINDUCTOR_COMPILE_THREADS': '32', 'SLURM_SUBMIT_HOST': 'login-node-0', 'CONDA_PYTHON_EXE': '/home/xun/anaconda3/bin/python', 'LD_LIBRARY_PATH': '/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:', 'NCCL_IB_DISABLE': '0', 'XDG_RUNTIME_DIR': '/run/user/1005', 'SLURM_JOB_ID': '29496', 'SSL_CERT_FILE': '/usr/lib/ssl/certs/ca-certificates.crt', 'SLURM_NODEID': '0', 'PS1': '(stem) ', 'SLURM_STEP_NUM_NODES': '4', 'SSH_CLIENT': '67.163.187.8 57991 22', 'CONDA_DEFAULT_ENV': 'base', 'PYENV_ROOT': '/opt/pyenv', 'OPAL_PREFIX': '/opt/hpcx/ompi', 'OMP_NUM_THREADS': '1', 'OLD_LD_LIBRARY_PATH': '/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:', 'SLURM_STEP_TASKS_PER_NODE': '1(x4)', 'WORLD_MODEL_LOG_LEVEL': 'DEBUG', 'VSCODE_GIT_ASKPASS_MAIN': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/extensions/git/dist/askpass-main.js', 'CUDA_HOME': '/usr/local/cuda-12.8', 'DATA_ROOT_DIR': '/home/xun/rsadhukh/STEM/data', 'XDG_DATA_DIRS': '/usr/local/share:/usr/share:/var/lib/snapd/desktop', 'NPROC_PER_NODE': '8', 'TORCH_FR_BUFFER_SIZE': '32', 'TMP': '/scratch/local/xun/tmp', 'BROWSER': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/bin/helpers/browser.sh', 'SLURM_CONF': '/var/spool/slurmd/conf-cache/slurm.conf', 'PATH': '/home/xun/rsadhukh/STEM/stem/bin:/home/xun/.local/bin:/home/xun/bin:/opt/pyenv/shims:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/home/xun/.local/bin:/opt/pyenv/bin:/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/bin/remote-cli:/home/xun/.local/bin:/home/xun/.nvm/versions/node/v22.22.2/bin:/home/xun/anaconda3/bin:/home/xun/anaconda3/condabin:/home/xun/.local/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/opt/pyenv/bin:/home/xun/.local/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin', 'HPCX_NCCL_RDMA_SHARP_PLUGIN_DIR': '/opt/hpcx/nccl_rdma_sharp_plugin', 'SLURM_JOB_NAME': 'stem', 'MODULEPATH': '/etc/environment-modules/modules:/usr/share/modules/versions:/usr/share/modules/$MODULE_VERSION/modulefiles:/usr/share/modules/modulefiles', 'SLURM_NTASKS_PER_NODE': '1', 'HPCX_MPI_TESTS_DIR': '/opt/hpcx/ompi/tests', 'DBUS_SESSION_BUS_ADDRESS': 'unix:path=/run/user/1005/bus', 'OLD_OPAL_PREFIX': '/opt/hpcx/ompi', 'NVM_BIN': '/home/xun/.nvm/versions/node/v22.22.2/bin', 'SLURM_STEP_LAUNCHER_PORT': '44949', 'OMPI_MCA_plm_slurm_args': '--external-launcher', 'SLURM_JOB_GID': '1005', 'CPATH': '/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:', 'HF_ALLOW_CODE_EVAL': '1', 'OVSX_REGISTRY_URL': 'https://open-vsx.org', 'OLDPWD': '/home/xun/rsadhukh/STEM', 'SLURM_JOB_NODELIST': 'compute-node-[14,0,43-44]', 'MODULES_CMD': '/usr/lib/x86_64-linux-gnu/modulecmd.tcl', 'TERM_PROGRAM': 'vscode', 'SLURM_OUTPUT_MODE': 'standard', 'VSCODE_IPC_HOOK_CLI': '/run/user/1005/vscode-ipc-72e35561-a385-463f-9719-76416d7f3180.sock', 'I_MPI_HYDRA_BOOTSTRAP': 'slurm', 'BASH_FUNC_ml%%': '() { module ml "$@"\n}', 'BASH_FUNC_module%%': '() { eval `/usr/bin/tclsh8.6 /usr/lib/x86_64-linux-gnu/modulecmd.tcl bash "$@"`;\n _mlstatus=$?;\n return $_mlstatus\n}', '_': '/usr/bin/stdbuf', '_STDBUF_O': 'L', '_STDBUF_E': 'L', 'LD_PRELOAD': '/usr/libexec/coreutils/libstdbuf.so', 'LOCAL_RANK': '0', 'RANK': '0', 'GROUP_RANK': '0', 'ROLE_RANK': '0', 'ROLE_NAME': 'default', 'LOCAL_WORLD_SIZE': '8', 'GROUP_WORLD_SIZE': '4', 'ROLE_WORLD_SIZE': '32', 'TORCHELASTIC_RESTART_COUNT': '0', 'TORCHELASTIC_MAX_RESTARTS': '0', 'TORCHELASTIC_RUN_ID': 'none', 'TORCHELASTIC_USE_AGENT_STORE': 'True', 'TORCH_NCCL_ASYNC_ERROR_HANDLING': '1', 'TORCHELASTIC_ERROR_FILE': '/scratch/local/xun/tmp/torchelastic__l7hjh76/none_qxjr82kf/attempt_0/0/error.json', 'CUDA_MODULE_LOADING': 'LAZY', 'TORCHINDUCTOR_CACHE_DIR': '/scratch/local/xun/tmp/torchinductor_xun', 'KMP_DUPLICATE_LIB_OK': 'True', 'KMP_INIT_AT_FORK': 'FALSE', 'MKL_SERVICE_FORCE_INTEL': 'GNU', 'MKL_NUM_THREADS': '1', 'ENABLE_INTRA_NODE_COMM': '1', 'TORCH_NCCL_AVOID_RECORD_STREAMS': '1', 'NCCL_IB_TIMEOUT': '22', 'NCCL_DEBUG': 'INFO', 'TRITON_CACHE_DIR': '/scratch/local/xun/tmp/tmph8ew25jc'}) 0: INFO 26-04-29 01:17:47.053223 - 0:00:15 - Starting job: olmo2_1B_midfine 0: INFO 26-04-29 01:17:47.053496 - 0:00:15 - Running on dp rank : 0 0: INFO 26-04-29 01:17:47.053539 - 0:00:15 - Running on dp size : 32 0: INFO 26-04-29 01:17:47.053576 - 0:00:15 - Using model type: olmo3 (OLMo3LMTransformer) 0: INFO 26-04-29 01:17:47.055857 - 0:00:15 - Building model 0: INFO 26-04-29 01:17:47.070149 - 0:00:15 - Model is built ! 0: WARNING 26-04-29 01:17:47.260916 - 0:00:15 - Model parameter layers.0.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.261447 - 0:00:15 - Model parameter layers.0.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.261753 - 0:00:15 - Model parameter layers.0.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.262028 - 0:00:15 - Model parameter layers.0.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.262275 - 0:00:15 - Model parameter layers.0.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.262511 - 0:00:15 - Model parameter layers.0.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.262958 - 0:00:15 - Model parameter layers.0.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.263315 - 0:00:15 - Model parameter layers.0.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.263597 - 0:00:15 - Model parameter layers.0.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.263825 - 0:00:15 - Model parameter layers.0.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.264048 - 0:00:15 - Model parameter layers.0.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.264325 - 0:00:15 - Model parameter layers.1.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.264613 - 0:00:15 - Model parameter layers.1.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.264879 - 0:00:15 - Model parameter layers.1.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.265142 - 0:00:15 - Model parameter layers.1.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.265376 - 0:00:15 - Model parameter layers.1.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.265600 - 0:00:15 - Model parameter layers.1.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.265864 - 0:00:15 - Model parameter layers.1.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.266131 - 0:00:15 - Model parameter layers.1.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.266409 - 0:00:15 - Model parameter layers.1.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.266639 - 0:00:15 - Model parameter layers.1.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.266919 - 0:00:15 - Model parameter layers.1.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.267236 - 0:00:15 - Model parameter layers.2.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.267532 - 0:00:15 - Model parameter layers.2.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.267808 - 0:00:15 - Model parameter layers.2.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.268073 - 0:00:15 - Model parameter layers.2.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.268303 - 0:00:15 - Model parameter layers.2.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.268529 - 0:00:15 - Model parameter layers.2.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.268800 - 0:00:15 - Model parameter layers.2.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.269066 - 0:00:15 - Model parameter layers.2.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.269337 - 0:00:15 - Model parameter layers.2.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.269567 - 0:00:15 - Model parameter layers.2.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.269787 - 0:00:15 - Model parameter layers.2.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.270049 - 0:00:15 - Model parameter layers.3.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.270323 - 0:00:15 - Model parameter layers.3.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.270592 - 0:00:15 - Model parameter layers.3.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.271178 - 0:00:15 - Model parameter layers.3.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.271519 - 0:00:15 - Model parameter layers.3.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.271782 - 0:00:15 - Model parameter layers.3.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.272056 - 0:00:15 - Model parameter layers.3.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.272333 - 0:00:15 - Model parameter layers.3.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.272611 - 0:00:15 - Model parameter layers.3.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.272848 - 0:00:15 - Model parameter layers.3.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.273068 - 0:00:15 - Model parameter layers.3.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.273352 - 0:00:15 - Model parameter layers.4.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.273624 - 0:00:15 - Model parameter layers.4.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.273889 - 0:00:15 - Model parameter layers.4.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.274157 - 0:00:15 - Model parameter layers.4.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.274390 - 0:00:15 - Model parameter layers.4.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.274612 - 0:00:15 - Model parameter layers.4.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.275086 - 0:00:15 - Model parameter layers.4.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.275388 - 0:00:15 - Model parameter layers.4.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.275658 - 0:00:15 - Model parameter layers.4.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.275879 - 0:00:15 - Model parameter layers.4.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.276098 - 0:00:15 - Model parameter layers.4.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.276371 - 0:00:15 - Model parameter layers.5.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.276650 - 0:00:15 - Model parameter layers.5.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.276920 - 0:00:15 - Model parameter layers.5.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.277182 - 0:00:15 - Model parameter layers.5.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.277415 - 0:00:15 - Model parameter layers.5.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.277637 - 0:00:15 - Model parameter layers.5.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.277924 - 0:00:15 - Model parameter layers.5.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.278188 - 0:00:15 - Model parameter layers.5.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.278454 - 0:00:15 - Model parameter layers.5.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.278679 - 0:00:15 - Model parameter layers.5.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.278986 - 0:00:15 - Model parameter layers.5.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.279311 - 0:00:15 - Model parameter layers.6.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.279575 - 0:00:15 - Model parameter layers.6.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.279843 - 0:00:15 - Model parameter layers.6.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.280120 - 0:00:15 - Model parameter layers.6.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.280348 - 0:00:15 - Model parameter layers.6.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.280571 - 0:00:15 - Model parameter layers.6.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.280837 - 0:00:15 - Model parameter layers.6.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.281102 - 0:00:15 - Model parameter layers.6.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.281367 - 0:00:15 - Model parameter layers.6.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.281593 - 0:00:15 - Model parameter layers.6.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.281808 - 0:00:15 - Model parameter layers.6.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.282078 - 0:00:15 - Model parameter layers.7.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.282356 - 0:00:15 - Model parameter layers.7.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.282631 - 0:00:15 - Model parameter layers.7.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.282947 - 0:00:15 - Model parameter layers.7.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.283212 - 0:00:15 - Model parameter layers.7.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.283453 - 0:00:15 - Model parameter layers.7.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.283713 - 0:00:15 - Model parameter layers.7.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.283977 - 0:00:15 - Model parameter layers.7.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.284243 - 0:00:15 - Model parameter layers.7.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.284474 - 0:00:15 - Model parameter layers.7.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.284688 - 0:00:15 - Model parameter layers.7.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.284960 - 0:00:15 - Model parameter layers.8.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.285216 - 0:00:15 - Model parameter layers.8.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.285488 - 0:00:15 - Model parameter layers.8.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.285754 - 0:00:15 - Model parameter layers.8.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.285971 - 0:00:15 - Model parameter layers.8.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.286184 - 0:00:15 - Model parameter layers.8.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.286456 - 0:00:15 - Model parameter layers.8.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.286726 - 0:00:15 - Model parameter layers.8.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.287435 - 0:00:15 - Model parameter layers.8.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.287827 - 0:00:15 - Model parameter layers.8.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.288241 - 0:00:15 - Model parameter layers.8.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.288570 - 0:00:15 - Model parameter layers.9.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.288831 - 0:00:15 - Model parameter layers.9.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.289100 - 0:00:15 - Model parameter layers.9.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.289369 - 0:00:15 - Model parameter layers.9.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.289598 - 0:00:15 - Model parameter layers.9.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.289811 - 0:00:15 - Model parameter layers.9.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.290081 - 0:00:15 - Model parameter layers.9.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.290362 - 0:00:15 - Model parameter layers.9.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.290626 - 0:00:15 - Model parameter layers.9.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.290878 - 0:00:15 - Model parameter layers.9.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.291130 - 0:00:15 - Model parameter layers.9.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.291421 - 0:00:15 - Model parameter layers.10.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.291687 - 0:00:15 - Model parameter layers.10.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.291955 - 0:00:15 - Model parameter layers.10.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.292218 - 0:00:15 - Model parameter layers.10.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.292474 - 0:00:15 - Model parameter layers.10.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.292740 - 0:00:15 - Model parameter layers.10.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.293061 - 0:00:15 - Model parameter layers.10.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.293359 - 0:00:15 - Model parameter layers.10.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.293649 - 0:00:15 - Model parameter layers.10.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.293884 - 0:00:15 - Model parameter layers.10.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.294113 - 0:00:15 - Model parameter layers.10.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.294409 - 0:00:15 - Model parameter layers.11.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.294691 - 0:00:15 - Model parameter layers.11.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.295056 - 0:00:15 - Model parameter layers.11.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.295407 - 0:00:15 - Model parameter layers.11.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.295671 - 0:00:15 - Model parameter layers.11.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.295905 - 0:00:15 - Model parameter layers.11.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.296174 - 0:00:15 - Model parameter layers.11.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.296461 - 0:00:15 - Model parameter layers.11.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.296743 - 0:00:15 - Model parameter layers.11.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.296994 - 0:00:15 - Model parameter layers.11.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.297226 - 0:00:15 - Model parameter layers.11.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.297541 - 0:00:15 - Model parameter layers.12.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.297816 - 0:00:15 - Model parameter layers.12.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.298108 - 0:00:15 - Model parameter layers.12.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.298378 - 0:00:15 - Model parameter layers.12.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.298621 - 0:00:15 - Model parameter layers.12.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.298915 - 0:00:15 - Model parameter layers.12.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.299255 - 0:00:15 - Model parameter layers.12.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.299543 - 0:00:15 - Model parameter layers.12.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.299818 - 0:00:15 - Model parameter layers.12.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.300050 - 0:00:15 - Model parameter layers.12.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.300294 - 0:00:15 - Model parameter layers.12.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.300602 - 0:00:15 - Model parameter layers.13.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.300872 - 0:00:15 - Model parameter layers.13.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.301136 - 0:00:15 - Model parameter layers.13.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.301411 - 0:00:15 - Model parameter layers.13.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.301707 - 0:00:15 - Model parameter layers.13.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.301929 - 0:00:15 - Model parameter layers.13.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.302191 - 0:00:15 - Model parameter layers.13.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.302466 - 0:00:15 - Model parameter layers.13.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.302734 - 0:00:15 - Model parameter layers.13.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.303056 - 0:00:15 - Model parameter layers.13.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.303375 - 0:00:15 - Model parameter layers.13.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.303666 - 0:00:15 - Model parameter layers.14.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.303936 - 0:00:15 - Model parameter layers.14.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.304200 - 0:00:15 - Model parameter layers.14.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.304485 - 0:00:15 - Model parameter layers.14.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.304727 - 0:00:15 - Model parameter layers.14.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.305021 - 0:00:15 - Model parameter layers.14.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.305343 - 0:00:15 - Model parameter layers.14.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.305633 - 0:00:15 - Model parameter layers.14.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.305903 - 0:00:15 - Model parameter layers.14.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.306116 - 0:00:15 - Model parameter layers.14.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.306353 - 0:00:15 - Model parameter layers.14.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.306622 - 0:00:15 - Model parameter layers.15.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.306934 - 0:00:15 - Model parameter layers.15.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.307249 - 0:00:15 - Model parameter layers.15.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.307519 - 0:00:15 - Model parameter layers.15.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.307736 - 0:00:15 - Model parameter layers.15.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.307950 - 0:00:15 - Model parameter layers.15.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.308212 - 0:00:15 - Model parameter layers.15.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.308482 - 0:00:15 - Model parameter layers.15.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.308749 - 0:00:15 - Model parameter layers.15.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.308968 - 0:00:15 - Model parameter layers.15.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.309187 - 0:00:15 - Model parameter layers.15.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.309744 - 0:00:15 - Model parameter tok_embeddings.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.310005 - 0:00:15 - Model parameter norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.310305 - 0:00:15 - Model parameter output.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 01:17:47.310637 - 0:00:15 - Model parameter rope_embeddings.freqs_cis is all zeros: it might be because of a missing initialization 0: INFO 26-04-29 01:17:47.311307 - 0:00:15 - Model size: 1,484,916,736 total parameters 0: INFO 26-04-29 01:17:47.311812 - 0:00:15 - GPU capacity: NVIDIA H200 (0) with 139.80GiB memory 0: INFO 26-04-29 01:17:47.316593 - 0:00:15 - GPU memory usage: NVIDIA H200 (0): 139.80084228515625 GiB capacity, 0.208984375 GiB peak, 0.14948720736154641% peak 0: INFO 26-04-29 01:17:47.316718 - 0:00:15 - Starting build of optimizer... 0: INFO 26-04-29 01:17:47.317860 - 0:00:15 - Done with build of optimizer. 0: INFO 26-04-29 01:17:47.317947 - 0:00:15 - Using global DP dataloader sharding: rank 0/32 0: INFO 26-04-29 01:17:48.416554 - 0:00:16 - Loading initial model & optimizer from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/ 0: DEBUG 26-04-29 01:18:01.900045 - 0:00:30 - Using selector: EpollSelector 0: DEBUG 26-04-29 01:18:02.063582 - 0:00:30 - Popen(['git', 'version'], cwd=/home/xun/rsadhukh/STEM, stdin=None, shell=False, universal_newlines=False) 0: DEBUG 26-04-29 01:18:02.076767 - 0:00:30 - Popen(['git', 'version'], cwd=/home/xun/rsadhukh/STEM, stdin=None, shell=False, universal_newlines=False) 0: DEBUG 26-04-29 01:18:02.081241 - 0:00:30 - sys.platform='linux', git_executable='git' 0: DEBUG 26-04-29 01:18:02.087405 - 0:00:30 - Popen(['git', 'rev-parse', '--show-toplevel'], cwd=/home/xun/rsadhukh/STEM, stdin=None, shell=False, universal_newlines=False) 0: DEBUG 26-04-29 01:18:02.099947 - 0:00:30 - Starting new HTTPS connection (1): api.wandb.ai:443 0: DEBUG 26-04-29 01:18:02.771177 - 0:00:31 - https://api.wandb.ai:443 "POST /graphql HTTP/1.1" 200 None 0: DEBUG 26-04-29 01:18:03.086199 - 0:00:31 - sys.platform='linux', git_executable='git' 0: DEBUG 26-04-29 01:18:03.092567 - 0:00:31 - Popen(['git', 'cat-file', '--batch-check'], cwd=/home/xun/rsadhukh/STEM, stdin=, shell=False, universal_newlines=False) 0: INFO 26-04-29 01:18:04.282070 - 0:00:32 - Loading data loader... 0: WARNING 26-04-29 01:18:04.282961 - 0:00:32 - track_packed_source_mixture=True: source counts are updated in the dataloader process only; forcing synchronous dataloader (load_async=False) for this run. 0: INFO 26-04-29 01:18:04.283282 - 0:00:32 - Loaded data loader! 0: INFO 26-04-29 01:18:04.283981 - 0:00:32 - Profiling active. Traces will be saved at /home/xun/rsadhukh/STEM/logs/midfine_base_final/profiling 0: INFO 26-04-29 01:18:04.284841 - 0:00:32 - Creating trace directory /home/xun/rsadhukh/STEM/logs/midfine_base_final/profiling! 0: INFO 26-04-29 01:18:04.286509 - 0:00:32 - Created trace directory! 0: INFO 26-04-29 01:18:04.287098 - 0:00:32 - Waiting at profiler barrier... 0: INFO 26-04-29 01:18:04.287849 - 0:00:32 - Profiler barrier passed 0: INFO 26-04-29 01:18:05.275657 - 0:00:33 - Using vocab_size=100352 from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/config.json (tokenizer has 100278 tokens) 0: INFO 26-04-29 01:18:05.276922 - 0:00:33 - HuggingFace tokenizer loaded from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/ – #words: 100352, BOS ID: 100257, EOS ID: 100257 0: INFO 26-04-29 01:19:57.625300 - 0:02:26 - garbage collection 0: INFO 26-04-29 01:20:11.907370 - 0:02:40 - step: 10 acc: 0 loss: 1.6466 grad: 2.54e-01 flops: 4.42e+13 wps: 5.14e+03 iter: 0.7936 data: 0.072 lr: 7.44e-05 mem: 54% pow: 548.149 W 0: INFO 26-04-29 01:20:25.279913 - 0:02:53 - step: 20 acc: 0 loss: 1.8358 grad: 1.88e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.6168 data: 0.0611 lr: 7.44e-05 mem: 47% pow: 664.656 W 0: INFO 26-04-29 01:20:41.132521 - 0:03:09 - step: 30 acc: 0 loss: 1.835 grad: 1.66e-01 flops: 3.56e+14 wps: 4.13e+04 iter: 2.8493 data: 0.0623 lr: 7.44e-05 mem: 47% pow: 414.583 W 0: INFO 26-04-29 01:20:54.863283 - 0:03:23 - step: 40 acc: 0 loss: 1.9121 grad: 1.62e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6714 data: 0.0543 lr: 7.43e-05 mem: 47% pow: 635.793 W 0: INFO 26-04-29 01:21:08.299380 - 0:03:36 - Starting MemSnapshotsProfilerWandb profiler... 0: INFO 26-04-29 01:21:08.302192 - 0:03:36 - step: 50 acc: 0 loss: 1.7182 grad: 1.68e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6294 data: 0.0724 lr: 7.43e-05 mem: 47% pow: 640.701 W 0: INFO 26-04-29 01:21:09.635262 - 0:03:38 - Shutting down MemSnapshotsProfilerWandb profiler... 0: INFO 26-04-29 01:21:09.702489 - 0:03:38 - Starting PyTorchProfilerWandb profiler... 0: INFO 26-04-29 01:21:11.294774 - 0:03:39 - Shutting down PyTorchProfilerWandb profiler... 0: INFO 26-04-29 01:21:12.146409 - 0:03:40 - Begin analyze trace 0: INFO 26-04-29 01:21:12.474658 - 0:03:41 - End analyze trace 0: INFO 26-04-29 01:21:12.604616 - 0:03:41 - xFormers profiler done. summary: MemTrace : /home/xun/rsadhukh/STEM/logs/midfine_base_final/profiling/memory_trace_plot/000102_rank00_compute-node-14_1060320.html Step time (ms): 689 TFlop/step : 273.5 TFlops : 396.8 HFU : 0.000 MFU : 0.000 0: INFO 26-04-29 01:21:23.757336 - 0:03:52 - step: 60 acc: 0 loss: 1.7796 grad: 1.66e-01 flops: 3.65e+14 wps: 4.24e+04 iter: 0.6133 data: 0.0638 lr: 7.43e-05 mem: 47% pow: 659.071 W 0: INFO 26-04-29 01:21:39.672518 - 0:04:08 - step: 70 acc: 0 loss: 1.7176 grad: 1.61e-01 flops: 3.55e+14 wps: 4.12e+04 iter: 0.6259 data: 0.0682 lr: 7.43e-05 mem: 47% pow: 662.644 W 0: INFO 26-04-29 01:21:53.300752 - 0:04:21 - step: 80 acc: 0 loss: 1.778 grad: 1.64e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6174 data: 0.0627 lr: 7.43e-05 mem: 47% pow: 655.276 W 0: INFO 26-04-29 01:22:06.757781 - 0:04:35 - step: 90 acc: 0 loss: 1.6736 grad: 1.83e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6146 data: 0.0626 lr: 7.43e-05 mem: 47% pow: 661.813 W 0: INFO 26-04-29 01:22:20.371995 - 0:04:48 - step: 100 acc: 0 loss: 1.4958 grad: 1.84e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6838 data: 0.0662 lr: 7.43e-05 mem: 47% pow: 611.972 W 0: INFO 26-04-29 01:22:38.522356 - 0:05:07 - step: 110 acc: 0 loss: 1.7953 grad: 1.72e-01 flops: 3.11e+14 wps: 3.61e+04 iter: 0.6252 data: 0.074 lr: 7.42e-05 mem: 54% pow: 654.432 W 0: INFO 26-04-29 01:22:52.283066 - 0:05:20 - step: 120 acc: 0 loss: 2.2684 grad: 1.60e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6012 data: 0.0804 lr: 7.42e-05 mem: 47% pow: 652.077 W 0: INFO 26-04-29 01:23:06.160466 - 0:05:34 - step: 130 acc: 0 loss: 1.6405 grad: 1.86e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6334 data: 0.0649 lr: 7.42e-05 mem: 47% pow: 650.74 W 0: INFO 26-04-29 01:23:19.636423 - 0:05:48 - step: 140 acc: 0 loss: 1.8374 grad: 1.75e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6493 data: 0.0579 lr: 7.42e-05 mem: 47% pow: 643.214 W 0: INFO 26-04-29 01:23:33.467218 - 0:06:02 - step: 150 acc: 0 loss: 1.8466 grad: 1.70e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6262 data: 0.073 lr: 7.42e-05 mem: 47% pow: 656.468 W 0: INFO 26-04-29 01:23:47.053135 - 0:06:15 - step: 160 acc: 0 loss: 1.4422 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6508 data: 0.0659 lr: 7.42e-05 mem: 47% pow: 641.153 W 0: INFO 26-04-29 01:24:00.540354 - 0:06:29 - step: 170 acc: 0 loss: 1.6924 grad: 1.62e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6262 data: 0.0584 lr: 7.41e-05 mem: 47% pow: 665.107 W 0: INFO 26-04-29 01:24:14.229630 - 0:06:42 - step: 180 acc: 0 loss: 1.8209 grad: 1.78e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.597 data: 0.0716 lr: 7.41e-05 mem: 47% pow: 672.139 W 0: INFO 26-04-29 01:24:27.913304 - 0:06:56 - step: 190 acc: 0 loss: 1.7277 grad: 1.55e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6167 data: 0.0567 lr: 7.41e-05 mem: 47% pow: 660.206 W 0: INFO 26-04-29 01:24:41.531507 - 0:07:10 - step: 200 acc: 0 loss: 1.6985 grad: 1.64e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5975 data: 0.0742 lr: 7.41e-05 mem: 47% pow: 669.235 W 0: INFO 26-04-29 01:24:57.834266 - 0:07:26 - step: 210 acc: 0 loss: 1.5684 grad: 1.58e-01 flops: 3.46e+14 wps: 4.02e+04 iter: 0.6071 data: 0.0646 lr: 7.41e-05 mem: 54% pow: 669.185 W 0: INFO 26-04-29 01:25:12.931504 - 0:07:41 - step: 220 acc: 0 loss: 1.811 grad: 1.94e-01 flops: 3.74e+14 wps: 4.34e+04 iter: 0.6179 data: 0.0715 lr: 7.41e-05 mem: 47% pow: 663.796 W 0: INFO 26-04-29 01:25:26.697773 - 0:07:55 - step: 230 acc: 0 loss: 1.7285 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6588 data: 0.0667 lr: 7.41e-05 mem: 47% pow: 629.83 W 0: INFO 26-04-29 01:25:40.470082 - 0:08:09 - step: 240 acc: 0 loss: 1.4829 grad: 1.61e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6123 data: 0.0711 lr: 7.40e-05 mem: 47% pow: 680.222 W 0: INFO 26-04-29 01:25:53.803310 - 0:08:22 - step: 250 acc: 0 loss: 1.9218 grad: 1.62e-01 flops: 4.24e+14 wps: 4.92e+04 iter: 0.6112 data: 0.0655 lr: 7.40e-05 mem: 47% pow: 651.149 W 0: INFO 26-04-29 01:26:07.529839 - 0:08:36 - step: 260 acc: 0 loss: 1.9647 grad: 1.76e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6013 data: 0.0733 lr: 7.40e-05 mem: 47% pow: 665.473 W 0: INFO 26-04-29 01:26:21.810028 - 0:08:50 - step: 270 acc: 0 loss: 1.6662 grad: 1.62e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6176 data: 0.0729 lr: 7.40e-05 mem: 47% pow: 651.924 W 0: INFO 26-04-29 01:26:35.911568 - 0:09:04 - step: 280 acc: 0 loss: 1.5621 grad: 1.62e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6405 data: 0.0689 lr: 7.40e-05 mem: 47% pow: 647.03 W 0: INFO 26-04-29 01:26:50.051349 - 0:09:18 - step: 290 acc: 0 loss: 1.6207 grad: 1.55e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6062 data: 0.0637 lr: 7.40e-05 mem: 47% pow: 663.187 W 0: INFO 26-04-29 01:27:03.675471 - 0:09:32 - step: 300 acc: 0 loss: 1.5634 grad: 1.75e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6819 data: 0.0693 lr: 7.40e-05 mem: 47% pow: 614.607 W 0: INFO 26-04-29 01:27:21.838152 - 0:09:50 - step: 310 acc: 0 loss: 1.5064 grad: 1.67e-01 flops: 3.11e+14 wps: 3.61e+04 iter: 0.6447 data: 0.0732 lr: 7.39e-05 mem: 54% pow: 636.446 W 0: INFO 26-04-29 01:27:35.270595 - 0:10:03 - step: 320 acc: 0 loss: 1.6252 grad: 1.54e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6297 data: 0.0718 lr: 7.39e-05 mem: 47% pow: 641.586 W 0: INFO 26-04-29 01:27:48.871391 - 0:10:17 - step: 330 acc: 0 loss: 1.6676 grad: 1.58e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6489 data: 0.0827 lr: 7.39e-05 mem: 47% pow: 625.78 W 0: INFO 26-04-29 01:28:02.643541 - 0:10:31 - step: 340 acc: 0 loss: 1.7191 grad: 1.59e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6036 data: 0.0729 lr: 7.39e-05 mem: 47% pow: 667.593 W 0: INFO 26-04-29 01:28:17.742706 - 0:10:46 - step: 350 acc: 0 loss: 1.9012 grad: 1.62e-01 flops: 3.74e+14 wps: 4.34e+04 iter: 0.7269 data: 0.0713 lr: 7.39e-05 mem: 47% pow: 585.429 W 0: INFO 26-04-29 01:28:31.421453 - 0:11:00 - step: 360 acc: 0 loss: 1.7073 grad: 1.64e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6107 data: 0.0703 lr: 7.39e-05 mem: 47% pow: 654.704 W 0: INFO 26-04-29 01:28:45.374508 - 0:11:13 - step: 370 acc: 0 loss: 1.8199 grad: 1.73e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6837 data: 0.0546 lr: 7.39e-05 mem: 47% pow: 626.736 W 0: INFO 26-04-29 01:28:59.379593 - 0:11:27 - step: 380 acc: 0 loss: 1.494 grad: 1.69e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.7277 data: 0.0721 lr: 7.38e-05 mem: 47% pow: 588.829 W 0: INFO 26-04-29 01:29:13.150120 - 0:11:41 - step: 390 acc: 0 loss: 1.7137 grad: 1.52e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.604 data: 0.0759 lr: 7.38e-05 mem: 47% pow: 652.149 W 0: INFO 26-04-29 01:29:26.903986 - 0:11:55 - step: 400 acc: 0 loss: 1.5857 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.621 data: 0.0637 lr: 7.38e-05 mem: 47% pow: 652.742 W 0: INFO 26-04-29 01:29:43.235510 - 0:12:11 - step: 410 acc: 0 loss: 1.9293 grad: 1.58e-01 flops: 3.46e+14 wps: 4.01e+04 iter: 0.6251 data: 0.0623 lr: 7.38e-05 mem: 54% pow: 656.21 W 0: INFO 26-04-29 01:29:57.095204 - 0:12:25 - step: 420 acc: 0 loss: 2.0284 grad: 1.57e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6968 data: 0.0567 lr: 7.38e-05 mem: 47% pow: 622.514 W 0: INFO 26-04-29 01:30:10.778421 - 0:12:39 - step: 430 acc: 0 loss: 1.843 grad: 1.78e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6544 data: 0.075 lr: 7.38e-05 mem: 47% pow: 630.616 W 0: INFO 26-04-29 01:30:24.985320 - 0:12:53 - step: 440 acc: 0 loss: 1.9355 grad: 1.59e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6242 data: 0.0705 lr: 7.37e-05 mem: 47% pow: 654.443 W 0: INFO 26-04-29 01:30:38.318907 - 0:13:06 - step: 450 acc: 0 loss: 1.8857 grad: 1.62e-01 flops: 4.24e+14 wps: 4.92e+04 iter: 0.6088 data: 0.0709 lr: 7.37e-05 mem: 47% pow: 651.036 W 0: INFO 26-04-29 01:30:51.811310 - 0:13:20 - step: 460 acc: 0 loss: 1.5857 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6013 data: 0.106 lr: 7.37e-05 mem: 47% pow: 639.803 W 0: INFO 26-04-29 01:31:06.550696 - 0:13:35 - step: 470 acc: 0 loss: 1.6336 grad: 1.55e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.618 data: 0.068 lr: 7.37e-05 mem: 47% pow: 656.73 W 0: INFO 26-04-29 01:31:20.109216 - 0:13:48 - step: 480 acc: 0 loss: 1.7931 grad: 1.54e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6327 data: 0.0579 lr: 7.37e-05 mem: 47% pow: 653.334 W 0: INFO 26-04-29 01:31:33.576848 - 0:14:02 - step: 490 acc: 0 loss: 1.5553 grad: 1.82e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6083 data: 0.0672 lr: 7.37e-05 mem: 47% pow: 658.851 W 0: INFO 26-04-29 01:31:47.347536 - 0:14:15 - step: 500 acc: 0 loss: 1.6015 grad: 1.68e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.7322 data: 0.0692 lr: 7.37e-05 mem: 47% pow: 593.171 W 0: INFO 26-04-29 01:32:03.795861 - 0:14:32 - step: 510 acc: 0 loss: 2.0245 grad: 1.62e-01 flops: 3.43e+14 wps: 3.99e+04 iter: 0.6492 data: 0.0665 lr: 7.36e-05 mem: 54% pow: 633.745 W 0: INFO 26-04-29 01:32:17.398638 - 0:14:45 - step: 520 acc: 0 loss: 1.8947 grad: 1.74e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6102 data: 0.0632 lr: 7.36e-05 mem: 47% pow: 666.501 W 0: INFO 26-04-29 01:32:31.026773 - 0:14:59 - step: 530 acc: 0 loss: 1.6575 grad: 1.68e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.7304 data: 0.0643 lr: 7.36e-05 mem: 47% pow: 591.973 W 0: INFO 26-04-29 01:32:44.828923 - 0:15:13 - step: 540 acc: 0 loss: 1.7886 grad: 1.63e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.9009 data: 0.068 lr: 7.36e-05 mem: 47% pow: 496.769 W 0: INFO 26-04-29 01:32:58.936955 - 0:15:27 - step: 550 acc: 0 loss: 1.5362 grad: 1.59e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6501 data: 0.0654 lr: 7.36e-05 mem: 47% pow: 636.533 W 0: INFO 26-04-29 01:33:12.733869 - 0:15:41 - step: 560 acc: 0 loss: 1.5847 grad: 1.64e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5786 data: 0.1165 lr: 7.36e-05 mem: 47% pow: 649.651 W 0: INFO 26-04-29 01:33:26.461931 - 0:15:55 - step: 570 acc: 0 loss: 1.7041 grad: 1.58e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7313 data: 0.0667 lr: 7.36e-05 mem: 47% pow: 592.223 W 0: INFO 26-04-29 01:33:39.863161 - 0:16:08 - step: 580 acc: 0 loss: 1.5254 grad: 1.68e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.6122 data: 0.0688 lr: 7.35e-05 mem: 47% pow: 651.454 W 0: INFO 26-04-29 01:33:53.667104 - 0:16:22 - step: 590 acc: 0 loss: 1.4869 grad: 1.53e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6176 data: 0.0626 lr: 7.35e-05 mem: 47% pow: 658.897 W 0: INFO 26-04-29 01:34:07.673831 - 0:16:36 - step: 600 acc: 0 loss: 1.7599 grad: 1.59e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6155 data: 0.0732 lr: 7.35e-05 mem: 47% pow: 660.505 W 0: INFO 26-04-29 01:34:24.297198 - 0:16:52 - step: 610 acc: 0 loss: 1.5145 grad: 1.91e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6052 data: 0.0686 lr: 7.35e-05 mem: 54% pow: 663.297 W 0: INFO 26-04-29 01:34:38.314928 - 0:17:06 - step: 620 acc: 0 loss: 1.4561 grad: 1.65e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.68 data: 0.0748 lr: 7.35e-05 mem: 47% pow: 630.765 W 0: INFO 26-04-29 01:34:52.146464 - 0:17:20 - step: 630 acc: 0 loss: 1.5001 grad: 1.56e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6341 data: 0.0735 lr: 7.35e-05 mem: 47% pow: 641.644 W 0: INFO 26-04-29 01:35:05.949412 - 0:17:34 - step: 640 acc: 0 loss: 1.6208 grad: 1.50e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6315 data: 0.069 lr: 7.34e-05 mem: 47% pow: 636.643 W 0: INFO 26-04-29 01:35:19.557009 - 0:17:48 - step: 650 acc: 0 loss: 1.7545 grad: 1.65e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6874 data: 0.0686 lr: 7.34e-05 mem: 47% pow: 610.141 W 0: INFO 26-04-29 01:35:33.247079 - 0:18:01 - step: 660 acc: 0 loss: 1.6128 grad: 1.67e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6355 data: 0.0691 lr: 7.34e-05 mem: 47% pow: 644.709 W 0: INFO 26-04-29 01:35:46.732345 - 0:18:15 - step: 670 acc: 0 loss: 1.3673 grad: 1.60e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.624 data: 0.0699 lr: 7.34e-05 mem: 47% pow: 651.587 W 0: INFO 26-04-29 01:36:00.385555 - 0:18:28 - step: 680 acc: 0 loss: 1.5295 grad: 1.49e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.7367 data: 0.0688 lr: 7.34e-05 mem: 47% pow: 598.968 W 0: INFO 26-04-29 01:36:14.732442 - 0:18:43 - step: 690 acc: 0 loss: 1.8446 grad: 1.64e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6274 data: 0.0617 lr: 7.34e-05 mem: 47% pow: 655.993 W 0: INFO 26-04-29 01:36:28.457854 - 0:18:57 - step: 700 acc: 0 loss: 1.1294 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7369 data: 0.0538 lr: 7.34e-05 mem: 47% pow: 596.282 W 0: INFO 26-04-29 01:36:44.981463 - 0:19:13 - step: 710 acc: 0 loss: 1.7758 grad: 1.68e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6308 data: 0.063 lr: 7.33e-05 mem: 54% pow: 655.441 W 0: INFO 26-04-29 01:36:58.667670 - 0:19:27 - step: 720 acc: 0 loss: 1.7584 grad: 1.51e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6741 data: 0.0737 lr: 7.33e-05 mem: 47% pow: 618.195 W 0: INFO 26-04-29 01:37:12.146222 - 0:19:40 - step: 730 acc: 0 loss: 2.0484 grad: 1.59e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6321 data: 0.0551 lr: 7.33e-05 mem: 47% pow: 655.175 W 0: INFO 26-04-29 01:37:25.758464 - 0:19:54 - step: 740 acc: 0 loss: 1.6552 grad: 1.60e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6079 data: 0.0726 lr: 7.33e-05 mem: 47% pow: 654.453 W 0: INFO 26-04-29 01:37:39.645873 - 0:20:08 - step: 750 acc: 0 loss: 1.6633 grad: 1.52e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6241 data: 0.0618 lr: 7.33e-05 mem: 47% pow: 653.286 W 0: INFO 26-04-29 01:37:53.177180 - 0:20:21 - step: 760 acc: 0 loss: 1.7905 grad: 1.47e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6409 data: 0.0554 lr: 7.33e-05 mem: 47% pow: 653.801 W 0: INFO 26-04-29 01:38:06.555817 - 0:20:35 - step: 770 acc: 0 loss: 1.6957 grad: 1.75e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.6328 data: 0.0529 lr: 7.33e-05 mem: 47% pow: 652.422 W 0: INFO 26-04-29 01:38:20.163297 - 0:20:48 - step: 780 acc: 0 loss: 1.738 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6291 data: 0.0722 lr: 7.32e-05 mem: 47% pow: 640.491 W 0: INFO 26-04-29 01:38:33.646056 - 0:21:02 - step: 790 acc: 0 loss: 1.7549 grad: 1.56e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6079 data: 0.0668 lr: 7.32e-05 mem: 47% pow: 668.572 W 0: INFO 26-04-29 01:38:47.081598 - 0:21:15 - step: 800 acc: 0 loss: 1.842 grad: 1.50e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6167 data: 0.072 lr: 7.32e-05 mem: 47% pow: 652.478 W 0: INFO 26-04-29 01:39:03.411836 - 0:21:31 - step: 810 acc: 0 loss: 1.7424 grad: 1.66e-01 flops: 3.46e+14 wps: 4.01e+04 iter: 0.6263 data: 0.0652 lr: 7.32e-05 mem: 54% pow: 649.21 W 0: INFO 26-04-29 01:39:17.169375 - 0:21:45 - step: 820 acc: 0 loss: 1.7219 grad: 1.49e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.5995 data: 0.0686 lr: 7.32e-05 mem: 47% pow: 669.797 W 0: INFO 26-04-29 01:39:30.834077 - 0:21:59 - step: 830 acc: 0 loss: 1.6152 grad: 1.58e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6109 data: 0.0684 lr: 7.32e-05 mem: 47% pow: 667.339 W 0: INFO 26-04-29 01:39:45.153390 - 0:22:13 - step: 840 acc: 0 loss: 1.6702 grad: 1.56e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.6022 data: 0.0715 lr: 7.32e-05 mem: 47% pow: 664.052 W 0: INFO 26-04-29 01:39:58.902996 - 0:22:27 - step: 850 acc: 0 loss: 1.4222 grad: 1.65e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6142 data: 0.0635 lr: 7.31e-05 mem: 47% pow: 660.152 W 0: INFO 26-04-29 01:40:12.432391 - 0:22:41 - step: 860 acc: 0 loss: 1.3401 grad: 1.49e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6019 data: 0.0739 lr: 7.31e-05 mem: 47% pow: 659.74 W 0: INFO 26-04-29 01:40:26.156927 - 0:22:54 - step: 870 acc: 0 loss: 1.6002 grad: 1.63e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.5823 data: 0.0956 lr: 7.31e-05 mem: 47% pow: 655.55 W 0: INFO 26-04-29 01:40:39.533837 - 0:23:08 - step: 880 acc: 0 loss: 1.6587 grad: 1.49e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.6181 data: 0.0604 lr: 7.31e-05 mem: 47% pow: 648.507 W 0: INFO 26-04-29 01:40:53.501061 - 0:23:22 - step: 890 acc: 0 loss: 1.8472 grad: 1.77e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6071 data: 0.0671 lr: 7.31e-05 mem: 47% pow: 663.595 W 0: INFO 26-04-29 01:41:07.438026 - 0:23:36 - step: 900 acc: 0 loss: 1.5353 grad: 1.67e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6563 data: 0.0638 lr: 7.31e-05 mem: 47% pow: 628.904 W 0: INFO 26-04-29 01:41:25.427242 - 0:23:54 - step: 910 acc: 0 loss: 1.7581 grad: 1.61e-01 flops: 3.14e+14 wps: 3.64e+04 iter: 0.6032 data: 0.0665 lr: 7.30e-05 mem: 54% pow: 665.436 W 0: INFO 26-04-29 01:41:39.323876 - 0:24:07 - step: 920 acc: 0 loss: 1.8787 grad: 1.66e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6248 data: 0.0706 lr: 7.30e-05 mem: 47% pow: 649.131 W 0: INFO 26-04-29 01:41:53.230612 - 0:24:21 - step: 930 acc: 0 loss: 1.5797 grad: 1.63e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6865 data: 0.0666 lr: 7.30e-05 mem: 47% pow: 620.655 W 0: INFO 26-04-29 01:42:06.841263 - 0:24:35 - step: 940 acc: 0 loss: 1.761 grad: 1.63e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6118 data: 0.0692 lr: 7.30e-05 mem: 47% pow: 658.787 W 0: INFO 26-04-29 01:42:20.588507 - 0:24:49 - step: 950 acc: 0 loss: 1.5538 grad: 1.52e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.617 data: 0.0674 lr: 7.30e-05 mem: 47% pow: 656.05 W 0: INFO 26-04-29 01:42:34.506387 - 0:25:03 - step: 960 acc: 0 loss: 1.6281 grad: 1.54e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6371 data: 0.0669 lr: 7.30e-05 mem: 47% pow: 652.562 W 0: INFO 26-04-29 01:42:48.167355 - 0:25:16 - step: 970 acc: 0 loss: 1.686 grad: 1.55e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6148 data: 0.0677 lr: 7.30e-05 mem: 47% pow: 659.501 W 0: INFO 26-04-29 01:43:01.923579 - 0:25:30 - step: 980 acc: 0 loss: 1.5279 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6097 data: 0.0639 lr: 7.29e-05 mem: 47% pow: 672.204 W 0: INFO 26-04-29 01:43:16.008698 - 0:25:44 - step: 990 acc: 0 loss: 1.4759 grad: 1.52e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6224 data: 0.0636 lr: 7.29e-05 mem: 47% pow: 654.624 W 0: INFO 26-04-29 01:43:29.778221 - 0:25:58 - step: 1000 acc: 0 loss: 1.7226 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6919 data: 0.0677 lr: 7.29e-05 mem: 47% pow: 611.132 W 0: INFO 26-04-29 01:43:33.449035 - 0:26:02 - garbage collection 0: INFO 26-04-29 01:43:48.426831 - 0:26:17 - step: 1010 acc: 0 loss: 1.4821 grad: 1.53e-01 flops: 3.03e+14 wps: 3.52e+04 iter: 0.8911 data: 0.0693 lr: 7.29e-05 mem: 54% pow: 495.025 W 0: INFO 26-04-29 01:44:02.133570 - 0:26:30 - step: 1020 acc: 0 loss: 1.851 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6893 data: 0.0026 lr: 7.29e-05 mem: 47% pow: 650.462 W 0: INFO 26-04-29 01:44:16.056915 - 0:26:44 - step: 1030 acc: 0 loss: 1.4001 grad: 1.64e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7378 data: 0.0751 lr: 7.29e-05 mem: 47% pow: 592.668 W 0: INFO 26-04-29 01:44:29.726920 - 0:26:58 - step: 1040 acc: 0 loss: 1.6869 grad: 1.57e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6347 data: 0.069 lr: 7.29e-05 mem: 47% pow: 647.266 W 0: INFO 26-04-29 01:44:43.671442 - 0:27:12 - step: 1050 acc: 0 loss: 1.7923 grad: 1.80e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.877 data: 0.0722 lr: 7.28e-05 mem: 47% pow: 505.831 W 0: INFO 26-04-29 01:44:57.478791 - 0:27:26 - step: 1060 acc: 0 loss: 1.7199 grad: 1.70e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6344 data: 0.0688 lr: 7.28e-05 mem: 47% pow: 662.307 W 0: INFO 26-04-29 01:45:11.177339 - 0:27:39 - step: 1070 acc: 0 loss: 1.5319 grad: 1.66e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.63 data: 0.0645 lr: 7.28e-05 mem: 47% pow: 655.595 W 0: INFO 26-04-29 01:45:24.830258 - 0:27:53 - step: 1080 acc: 0 loss: 1.8438 grad: 1.57e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6177 data: 0.0641 lr: 7.28e-05 mem: 47% pow: 654.139 W 0: INFO 26-04-29 01:45:39.578561 - 0:28:08 - step: 1090 acc: 0 loss: 1.8381 grad: 1.51e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.6507 data: 0.0678 lr: 7.28e-05 mem: 47% pow: 630.352 W 0: INFO 26-04-29 01:45:53.230700 - 0:28:21 - step: 1100 acc: 0 loss: 1.536 grad: 1.63e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6031 data: 0.0811 lr: 7.28e-05 mem: 47% pow: 651.498 W 0: INFO 26-04-29 01:46:09.728023 - 0:28:38 - step: 1110 acc: 0 loss: 1.7593 grad: 1.64e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6178 data: 0.0709 lr: 7.27e-05 mem: 54% pow: 659.946 W 0: INFO 26-04-29 01:46:23.710600 - 0:28:52 - step: 1120 acc: 0 loss: 1.7643 grad: 1.58e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6317 data: 0.073 lr: 7.27e-05 mem: 47% pow: 638.43 W 0: INFO 26-04-29 01:46:37.610697 - 0:29:06 - step: 1130 acc: 0 loss: 2.1924 grad: 1.48e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6397 data: 0.0687 lr: 7.27e-05 mem: 47% pow: 644.674 W 0: INFO 26-04-29 01:46:51.647822 - 0:29:20 - step: 1140 acc: 0 loss: 1.7303 grad: 1.57e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6211 data: 0.0874 lr: 7.27e-05 mem: 47% pow: 640.885 W 0: INFO 26-04-29 01:47:05.541972 - 0:29:34 - step: 1150 acc: 0 loss: 1.649 grad: 1.60e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.8407 data: 0.0747 lr: 7.27e-05 mem: 47% pow: 521.73 W 0: INFO 26-04-29 01:47:19.265680 - 0:29:47 - step: 1160 acc: 0 loss: 1.6424 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.637 data: 0.0642 lr: 7.27e-05 mem: 47% pow: 639.412 W 0: INFO 26-04-29 01:47:34.343907 - 0:30:02 - step: 1170 acc: 0 loss: 1.3315 grad: 1.71e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.6164 data: 0.0759 lr: 7.27e-05 mem: 47% pow: 647.008 W 0: INFO 26-04-29 01:47:48.093938 - 0:30:16 - step: 1180 acc: 0 loss: 1.7709 grad: 1.82e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6865 data: 0.0672 lr: 7.26e-05 mem: 47% pow: 610.228 W 0: INFO 26-04-29 01:48:02.348037 - 0:30:30 - step: 1190 acc: 0 loss: 1.6963 grad: 1.60e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6172 data: 0.0848 lr: 7.26e-05 mem: 47% pow: 638.8 W 0: INFO 26-04-29 01:48:16.311883 - 0:30:44 - step: 1200 acc: 0 loss: 1.4762 grad: 1.60e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6554 data: 0.0772 lr: 7.26e-05 mem: 47% pow: 636.242 W 0: INFO 26-04-29 01:48:32.652265 - 0:31:01 - step: 1210 acc: 0 loss: 1.7552 grad: 1.77e-01 flops: 3.46e+14 wps: 4.01e+04 iter: 0.6019 data: 0.0803 lr: 7.26e-05 mem: 54% pow: 651.676 W 0: INFO 26-04-29 01:48:46.409100 - 0:31:14 - step: 1220 acc: 0 loss: 1.8614 grad: 1.57e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.6077 data: 0.0645 lr: 7.26e-05 mem: 47% pow: 670.259 W 0: INFO 26-04-29 01:49:00.296730 - 0:31:28 - step: 1230 acc: 0 loss: 1.8303 grad: 1.58e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6152 data: 0.0636 lr: 7.26e-05 mem: 47% pow: 650.214 W 0: INFO 26-04-29 01:49:14.465329 - 0:31:43 - step: 1240 acc: 0 loss: 1.6001 grad: 1.53e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6238 data: 0.0686 lr: 7.26e-05 mem: 47% pow: 653.213 W 0: INFO 26-04-29 01:49:28.259701 - 0:31:56 - step: 1250 acc: 0 loss: 1.9613 grad: 1.67e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6113 data: 0.0711 lr: 7.25e-05 mem: 47% pow: 656.802 W 0: INFO 26-04-29 01:49:41.962697 - 0:32:10 - step: 1260 acc: 0 loss: 1.7428 grad: 1.62e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.626 data: 0.0657 lr: 7.25e-05 mem: 47% pow: 650.166 W 0: INFO 26-04-29 01:49:56.209261 - 0:32:24 - step: 1270 acc: 0 loss: 1.2936 grad: 1.52e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.628 data: 0.0653 lr: 7.25e-05 mem: 47% pow: 665.405 W 0: INFO 26-04-29 01:50:09.890828 - 0:32:38 - step: 1280 acc: 0 loss: 1.7247 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6137 data: 0.0678 lr: 7.25e-05 mem: 47% pow: 655.456 W 0: INFO 26-04-29 01:50:23.575159 - 0:32:52 - step: 1290 acc: 0 loss: 1.8045 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6508 data: 0.0682 lr: 7.25e-05 mem: 47% pow: 632.968 W 0: INFO 26-04-29 01:50:37.183505 - 0:33:05 - step: 1300 acc: 0 loss: 1.5253 grad: 1.70e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6328 data: 0.0708 lr: 7.25e-05 mem: 47% pow: 643.823 W 0: INFO 26-04-29 01:50:54.229246 - 0:33:22 - step: 1310 acc: 0 loss: 1.6118 grad: 1.49e-01 flops: 3.31e+14 wps: 3.85e+04 iter: 0.6162 data: 0.0722 lr: 7.25e-05 mem: 54% pow: 666.779 W 0: INFO 26-04-29 01:51:08.066736 - 0:33:36 - step: 1320 acc: 0 loss: 1.8551 grad: 1.50e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7839 data: 0.0643 lr: 7.24e-05 mem: 47% pow: 568.838 W 0: INFO 26-04-29 01:51:21.880862 - 0:33:50 - step: 1330 acc: 0 loss: 1.6958 grad: 1.62e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.8256 data: 0.0792 lr: 7.24e-05 mem: 47% pow: 529.432 W 0: INFO 26-04-29 01:51:35.758770 - 0:34:04 - step: 1340 acc: 0 loss: 1.7414 grad: 1.52e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.618 data: 0.0759 lr: 7.24e-05 mem: 47% pow: 650.221 W 0: INFO 26-04-29 01:51:49.762482 - 0:34:18 - step: 1350 acc: 0 loss: 1.5037 grad: 1.65e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6635 data: 0.0491 lr: 7.24e-05 mem: 47% pow: 635.719 W 0: INFO 26-04-29 01:52:03.383274 - 0:34:31 - step: 1360 acc: 0 loss: 1.637 grad: 1.51e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6074 data: 0.0752 lr: 7.24e-05 mem: 47% pow: 657.734 W 0: INFO 26-04-29 01:52:17.254085 - 0:34:45 - step: 1370 acc: 0 loss: 1.7294 grad: 1.58e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.8149 data: 0.0737 lr: 7.24e-05 mem: 47% pow: 542.567 W 0: INFO 26-04-29 01:52:31.150076 - 0:34:59 - step: 1380 acc: 0 loss: 1.7777 grad: 1.62e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6097 data: 0.0786 lr: 7.23e-05 mem: 47% pow: 664.204 W 0: INFO 26-04-29 01:52:44.698585 - 0:35:13 - step: 1390 acc: 0 loss: 2.1044 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5892 data: 0.108 lr: 7.23e-05 mem: 47% pow: 645.094 W 0: INFO 26-04-29 01:52:58.682565 - 0:35:27 - step: 1400 acc: 0 loss: 1.6052 grad: 1.50e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6199 data: 0.0657 lr: 7.23e-05 mem: 47% pow: 659.092 W 0: INFO 26-04-29 01:53:15.264825 - 0:35:43 - step: 1410 acc: 0 loss: 1.5155 grad: 1.51e-01 flops: 3.41e+14 wps: 3.95e+04 iter: 0.6164 data: 0.0694 lr: 7.23e-05 mem: 54% pow: 660.529 W 0: INFO 26-04-29 01:53:29.013692 - 0:35:57 - step: 1420 acc: 0 loss: 1.5678 grad: 1.61e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6422 data: 0.0638 lr: 7.23e-05 mem: 47% pow: 639.65 W 0: INFO 26-04-29 01:53:42.864754 - 0:36:11 - step: 1430 acc: 0 loss: 1.8674 grad: 1.67e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6309 data: 0.0704 lr: 7.23e-05 mem: 47% pow: 643.828 W 0: INFO 26-04-29 01:53:56.540036 - 0:36:25 - step: 1440 acc: 0 loss: 1.8476 grad: 1.63e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6435 data: 0.0698 lr: 7.23e-05 mem: 47% pow: 638.598 W 0: INFO 26-04-29 01:54:10.174120 - 0:36:38 - step: 1450 acc: 0 loss: 1.8616 grad: 1.68e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6162 data: 0.0709 lr: 7.22e-05 mem: 47% pow: 664.277 W 0: INFO 26-04-29 01:54:23.935632 - 0:36:52 - step: 1460 acc: 0 loss: 1.6658 grad: 1.67e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6327 data: 0.074 lr: 7.22e-05 mem: 47% pow: 645.466 W 0: INFO 26-04-29 01:54:37.948495 - 0:37:06 - step: 1470 acc: 0 loss: 1.7353 grad: 1.56e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6445 data: 0.0627 lr: 7.22e-05 mem: 47% pow: 641.708 W 0: INFO 26-04-29 01:54:51.713228 - 0:37:20 - step: 1480 acc: 0 loss: 1.5519 grad: 1.56e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6002 data: 0.0911 lr: 7.22e-05 mem: 47% pow: 658.202 W 0: INFO 26-04-29 01:55:05.575843 - 0:37:34 - step: 1490 acc: 0 loss: 2.0595 grad: 1.55e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6643 data: 0.068 lr: 7.22e-05 mem: 47% pow: 628.366 W 0: INFO 26-04-29 01:55:19.120974 - 0:37:47 - step: 1500 acc: 0 loss: 1.902 grad: 1.62e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6221 data: 0.0783 lr: 7.22e-05 mem: 47% pow: 640.514 W 0: INFO 26-04-29 01:55:36.221551 - 0:38:04 - step: 1510 acc: 0 loss: 1.3196 grad: 1.73e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.6236 data: 0.0732 lr: 7.22e-05 mem: 54% pow: 641.371 W 0: INFO 26-04-29 01:55:49.873202 - 0:38:18 - step: 1520 acc: 0 loss: 1.529 grad: 1.56e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.623 data: 0.0702 lr: 7.21e-05 mem: 47% pow: 651.772 W 0: INFO 26-04-29 01:56:03.610028 - 0:38:32 - step: 1530 acc: 0 loss: 1.8898 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6288 data: 0.0683 lr: 7.21e-05 mem: 47% pow: 641.677 W 0: INFO 26-04-29 01:56:17.574018 - 0:38:46 - step: 1540 acc: 0 loss: 1.8463 grad: 1.93e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6638 data: 0.0693 lr: 7.21e-05 mem: 47% pow: 624.321 W 0: INFO 26-04-29 01:56:31.364761 - 0:38:59 - step: 1550 acc: 0 loss: 1.7352 grad: 1.61e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6249 data: 0.0937 lr: 7.21e-05 mem: 47% pow: 628.586 W 0: INFO 26-04-29 01:56:45.496960 - 0:39:14 - step: 1560 acc: 0 loss: 1.5533 grad: 1.51e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6188 data: 0.069 lr: 7.21e-05 mem: 47% pow: 662.097 W 0: INFO 26-04-29 01:56:59.157750 - 0:39:27 - step: 1570 acc: 0 loss: 1.744 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6231 data: 0.0702 lr: 7.21e-05 mem: 47% pow: 643.76 W 0: INFO 26-04-29 01:57:12.780813 - 0:39:41 - step: 1580 acc: 0 loss: 2.0016 grad: 1.59e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6144 data: 0.0765 lr: 7.21e-05 mem: 47% pow: 673.596 W 0: INFO 26-04-29 01:57:26.715815 - 0:39:55 - step: 1590 acc: 0 loss: 1.6597 grad: 1.65e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6447 data: 0.0722 lr: 7.20e-05 mem: 47% pow: 634.783 W 0: INFO 26-04-29 01:57:40.601348 - 0:40:09 - step: 1600 acc: 0 loss: 1.8777 grad: 1.53e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5991 data: 0.082 lr: 7.20e-05 mem: 47% pow: 661.166 W 0: INFO 26-04-29 01:57:57.409741 - 0:40:25 - step: 1610 acc: 0 loss: 1.6629 grad: 1.56e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6174 data: 0.0726 lr: 7.20e-05 mem: 54% pow: 651.769 W 0: INFO 26-04-29 01:58:10.901101 - 0:40:39 - step: 1620 acc: 0 loss: 1.4079 grad: 1.57e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6254 data: 0.0709 lr: 7.20e-05 mem: 47% pow: 648.619 W 0: INFO 26-04-29 01:58:24.786431 - 0:40:53 - step: 1630 acc: 0 loss: 1.6645 grad: 1.63e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6149 data: 0.0701 lr: 7.20e-05 mem: 47% pow: 647.298 W 0: INFO 26-04-29 01:58:38.230273 - 0:41:06 - step: 1640 acc: 0 loss: 1.7837 grad: 1.78e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6102 data: 0.0718 lr: 7.20e-05 mem: 47% pow: 651.188 W 0: INFO 26-04-29 01:58:51.801855 - 0:41:20 - step: 1650 acc: 0 loss: 1.6621 grad: 1.53e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6063 data: 0.0685 lr: 7.19e-05 mem: 47% pow: 662.485 W 0: INFO 26-04-29 01:59:05.244310 - 0:41:33 - step: 1660 acc: 0 loss: 1.591 grad: 2.10e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6255 data: 0.0697 lr: 7.19e-05 mem: 47% pow: 646.995 W 0: INFO 26-04-29 01:59:18.790095 - 0:41:47 - step: 1670 acc: 0 loss: 1.9092 grad: 1.52e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6168 data: 0.0698 lr: 7.19e-05 mem: 47% pow: 659.821 W 0: INFO 26-04-29 01:59:32.681536 - 0:42:01 - step: 1680 acc: 0 loss: 1.8873 grad: 1.52e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6322 data: 0.0673 lr: 7.19e-05 mem: 47% pow: 643.207 W 0: INFO 26-04-29 01:59:46.190965 - 0:42:14 - step: 1690 acc: 0 loss: 1.7885 grad: 1.71e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6146 data: 0.0793 lr: 7.19e-05 mem: 47% pow: 669.479 W 0: INFO 26-04-29 02:00:00.251877 - 0:42:28 - step: 1700 acc: 0 loss: 1.9253 grad: 1.50e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6125 data: 0.0678 lr: 7.19e-05 mem: 47% pow: 677.799 W 0: INFO 26-04-29 02:00:16.711261 - 0:42:45 - step: 1710 acc: 0 loss: 1.9017 grad: 1.58e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.6085 data: 0.0706 lr: 7.19e-05 mem: 54% pow: 677.283 W 0: INFO 26-04-29 02:00:30.600071 - 0:42:59 - step: 1720 acc: 0 loss: 1.4616 grad: 1.67e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6126 data: 0.0807 lr: 7.18e-05 mem: 47% pow: 657.886 W 0: INFO 26-04-29 02:00:44.333573 - 0:43:12 - step: 1730 acc: 0 loss: 1.695 grad: 1.86e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6094 data: 0.0706 lr: 7.18e-05 mem: 47% pow: 651.368 W 0: INFO 26-04-29 02:00:57.845158 - 0:43:26 - step: 1740 acc: 0 loss: 1.8856 grad: 1.58e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6352 data: 0.0691 lr: 7.18e-05 mem: 47% pow: 640.445 W 0: INFO 26-04-29 02:01:11.397529 - 0:43:39 - step: 1750 acc: 0 loss: 1.7509 grad: 2.84e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6103 data: 0.0794 lr: 7.18e-05 mem: 47% pow: 648.28 W 0: INFO 26-04-29 02:01:24.978257 - 0:43:53 - step: 1760 acc: 0 loss: 1.3613 grad: 1.72e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6421 data: 0.0702 lr: 7.18e-05 mem: 47% pow: 645.213 W 0: INFO 26-04-29 02:01:38.763186 - 0:44:07 - step: 1770 acc: 0 loss: 1.5527 grad: 1.82e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6068 data: 0.0748 lr: 7.18e-05 mem: 47% pow: 652.38 W 0: INFO 26-04-29 02:01:52.377498 - 0:44:20 - step: 1780 acc: 0 loss: 1.943 grad: 1.73e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6068 data: 0.0701 lr: 7.18e-05 mem: 47% pow: 663.258 W 0: INFO 26-04-29 02:02:05.654172 - 0:44:34 - step: 1790 acc: 0 loss: 1.8281 grad: 1.60e-01 flops: 4.26e+14 wps: 4.94e+04 iter: 0.5982 data: 0.0713 lr: 7.17e-05 mem: 47% pow: 677.764 W 0: INFO 26-04-29 02:02:19.207626 - 0:44:47 - step: 1800 acc: 0 loss: 1.6725 grad: 1.52e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6287 data: 0.0695 lr: 7.17e-05 mem: 47% pow: 646.598 W 0: INFO 26-04-29 02:02:35.683539 - 0:45:04 - step: 1810 acc: 0 loss: 1.7587 grad: 1.56e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.6113 data: 0.0666 lr: 7.17e-05 mem: 54% pow: 659.754 W 0: INFO 26-04-29 02:02:49.236051 - 0:45:17 - step: 1820 acc: 0 loss: 1.4749 grad: 1.64e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6223 data: 0.0655 lr: 7.17e-05 mem: 47% pow: 652.729 W 0: INFO 26-04-29 02:03:02.718528 - 0:45:31 - step: 1830 acc: 0 loss: 1.5322 grad: 1.67e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5975 data: 0.0811 lr: 7.17e-05 mem: 47% pow: 665.648 W 0: INFO 26-04-29 02:03:16.256295 - 0:45:44 - step: 1840 acc: 0 loss: 1.8631 grad: 1.66e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6285 data: 0.0471 lr: 7.17e-05 mem: 47% pow: 660.762 W 0: INFO 26-04-29 02:03:29.910014 - 0:45:58 - step: 1850 acc: 0 loss: 1.5416 grad: 1.50e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6988 data: 0.0696 lr: 7.16e-05 mem: 47% pow: 598.913 W 0: INFO 26-04-29 02:03:43.480595 - 0:46:12 - step: 1860 acc: 0 loss: 1.5811 grad: 1.55e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6252 data: 0.073 lr: 7.16e-05 mem: 47% pow: 648.864 W 0: INFO 26-04-29 02:03:56.989817 - 0:46:25 - step: 1870 acc: 0 loss: 1.7044 grad: 1.52e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6156 data: 0.0678 lr: 7.16e-05 mem: 47% pow: 653.444 W 0: INFO 26-04-29 02:04:10.524069 - 0:46:39 - step: 1880 acc: 0 loss: 1.6507 grad: 1.61e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.6195 data: 0.0731 lr: 7.16e-05 mem: 47% pow: 661.939 W 0: INFO 26-04-29 02:04:23.982834 - 0:46:52 - step: 1890 acc: 0 loss: 1.9993 grad: 1.68e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6189 data: 0.0705 lr: 7.16e-05 mem: 47% pow: 663.458 W 0: INFO 26-04-29 02:04:37.543981 - 0:47:06 - step: 1900 acc: 0 loss: 1.8247 grad: 1.68e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6497 data: 0.0729 lr: 7.16e-05 mem: 47% pow: 627.296 W 0: INFO 26-04-29 02:04:54.860826 - 0:47:23 - step: 1910 acc: 0 loss: 1.5747 grad: 1.60e-01 flops: 3.26e+14 wps: 3.79e+04 iter: 1.3814 data: 0.0665 lr: 7.16e-05 mem: 54% pow: 406.269 W 0: INFO 26-04-29 02:05:08.258260 - 0:47:36 - step: 1920 acc: 0 loss: 1.5988 grad: 1.54e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.6385 data: 0.0583 lr: 7.15e-05 mem: 47% pow: 649.836 W 0: INFO 26-04-29 02:05:21.868803 - 0:47:50 - step: 1930 acc: 0 loss: 1.5876 grad: 1.58e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6294 data: 0.0741 lr: 7.15e-05 mem: 47% pow: 655.319 W 0: INFO 26-04-29 02:05:35.621146 - 0:48:04 - step: 1940 acc: 0 loss: 1.5029 grad: 1.87e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6142 data: 0.0701 lr: 7.15e-05 mem: 47% pow: 654.716 W 0: INFO 26-04-29 02:05:49.266731 - 0:48:17 - step: 1950 acc: 0 loss: 1.7214 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6418 data: 0.0472 lr: 7.15e-05 mem: 47% pow: 669.746 W 0: INFO 26-04-29 02:06:03.493415 - 0:48:32 - step: 1960 acc: 0 loss: 1.886 grad: 1.54e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6227 data: 0.0688 lr: 7.15e-05 mem: 47% pow: 646.719 W 0: INFO 26-04-29 02:06:17.084394 - 0:48:45 - step: 1970 acc: 0 loss: 1.5547 grad: 1.59e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6149 data: 0.0683 lr: 7.15e-05 mem: 47% pow: 655.673 W 0: INFO 26-04-29 02:06:30.765180 - 0:48:59 - step: 1980 acc: 0 loss: 1.5501 grad: 1.50e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6636 data: 0.0678 lr: 7.15e-05 mem: 47% pow: 631.5 W 0: INFO 26-04-29 02:06:46.065364 - 0:49:14 - step: 1990 acc: 0 loss: 1.7899 grad: 1.69e-01 flops: 3.69e+14 wps: 4.28e+04 iter: 0.6218 data: 0.062 lr: 7.14e-05 mem: 47% pow: 653.038 W 0: INFO 26-04-29 02:06:59.570011 - 0:49:28 - step: 2000 acc: 0 loss: 1.877 grad: 1.61e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6409 data: 0.0514 lr: 7.14e-05 mem: 47% pow: 648.196 W 0: INFO 26-04-29 02:07:03.205635 - 0:49:31 - garbage collection 0: INFO 26-04-29 02:07:18.050318 - 0:49:46 - step: 2010 acc: 0 loss: 1.7576 grad: 1.57e-01 flops: 3.06e+14 wps: 3.55e+04 iter: 0.6207 data: 0.0679 lr: 7.14e-05 mem: 54% pow: 649.469 W 0: INFO 26-04-29 02:07:32.550114 - 0:50:01 - step: 2020 acc: 0 loss: 1.4784 grad: 1.63e-01 flops: 3.90e+14 wps: 4.52e+04 iter: 0.6253 data: 0.0686 lr: 7.14e-05 mem: 47% pow: 649.826 W 0: INFO 26-04-29 02:07:46.356462 - 0:50:14 - step: 2030 acc: 0 loss: 1.8881 grad: 1.62e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6234 data: 0.0712 lr: 7.14e-05 mem: 47% pow: 650.722 W 0: INFO 26-04-29 02:08:00.482800 - 0:50:29 - step: 2040 acc: 0 loss: 1.646 grad: 1.52e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6087 data: 0.0656 lr: 7.14e-05 mem: 47% pow: 657.962 W 0: INFO 26-04-29 02:08:14.418760 - 0:50:43 - step: 2050 acc: 0 loss: 1.4973 grad: 1.89e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.624 data: 0.0725 lr: 7.14e-05 mem: 47% pow: 646.364 W 0: INFO 26-04-29 02:08:28.061830 - 0:50:56 - step: 2060 acc: 0 loss: 1.4425 grad: 1.67e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6049 data: 0.0679 lr: 7.13e-05 mem: 47% pow: 653.001 W 0: INFO 26-04-29 02:08:42.824393 - 0:51:11 - step: 2070 acc: 0 loss: 1.7852 grad: 1.51e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.6279 data: 0.0727 lr: 7.13e-05 mem: 47% pow: 639.569 W 0: INFO 26-04-29 02:08:58.876274 - 0:51:27 - step: 2080 acc: 0 loss: 1.7822 grad: 1.49e-01 flops: 3.52e+14 wps: 4.08e+04 iter: 0.6004 data: 0.0742 lr: 7.13e-05 mem: 47% pow: 672.68 W 0: INFO 26-04-29 02:09:14.917028 - 0:51:43 - step: 2090 acc: 0 loss: 1.5586 grad: 1.58e-01 flops: 3.52e+14 wps: 4.09e+04 iter: 0.6514 data: 0.0638 lr: 7.13e-05 mem: 47% pow: 635.921 W 0: INFO 26-04-29 02:09:29.130363 - 0:51:57 - step: 2100 acc: 0 loss: 1.7376 grad: 1.61e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.7113 data: 0.0719 lr: 7.13e-05 mem: 47% pow: 602.055 W 0: INFO 26-04-29 02:09:45.721026 - 0:52:14 - step: 2110 acc: 0 loss: 1.5519 grad: 1.58e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6079 data: 0.0698 lr: 7.13e-05 mem: 54% pow: 656.542 W 0: INFO 26-04-29 02:09:59.674641 - 0:52:28 - step: 2120 acc: 0 loss: 1.8461 grad: 1.46e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6208 data: 0.0639 lr: 7.12e-05 mem: 47% pow: 649.17 W 0: INFO 26-04-29 02:10:13.647179 - 0:52:42 - step: 2130 acc: 0 loss: 1.4896 grad: 1.61e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6118 data: 0.0686 lr: 7.12e-05 mem: 47% pow: 659.45 W 0: INFO 26-04-29 02:10:27.961674 - 0:52:56 - step: 2140 acc: 0 loss: 1.3766 grad: 1.60e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6317 data: 0.0686 lr: 7.12e-05 mem: 47% pow: 639.587 W 0: INFO 26-04-29 02:10:42.211945 - 0:53:10 - step: 2150 acc: 0 loss: 1.8008 grad: 1.58e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.6256 data: 0.0735 lr: 7.12e-05 mem: 47% pow: 650.061 W 0: INFO 26-04-29 02:10:57.741267 - 0:53:26 - step: 2160 acc: 0 loss: 1.3551 grad: 1.55e-01 flops: 3.64e+14 wps: 4.22e+04 iter: 0.6268 data: 0.0726 lr: 7.12e-05 mem: 47% pow: 641.97 W 0: INFO 26-04-29 02:11:12.576550 - 0:53:41 - step: 2170 acc: 0 loss: 1.4286 grad: 1.65e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.6755 data: 0.0029 lr: 7.12e-05 mem: 47% pow: 677.337 W 0: INFO 26-04-29 02:11:26.405014 - 0:53:54 - step: 2180 acc: 0 loss: 1.4657 grad: 1.61e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6414 data: 0.0684 lr: 7.12e-05 mem: 47% pow: 629.581 W 0: INFO 26-04-29 02:11:40.147174 - 0:54:08 - step: 2190 acc: 0 loss: 1.8165 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6192 data: 0.0734 lr: 7.11e-05 mem: 47% pow: 644.695 W 0: INFO 26-04-29 02:11:53.868977 - 0:54:22 - step: 2200 acc: 0 loss: 1.4823 grad: 1.51e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6314 data: 0.0685 lr: 7.11e-05 mem: 47% pow: 640.139 W 0: INFO 26-04-29 02:12:11.553817 - 0:54:40 - step: 2210 acc: 0 loss: 1.5127 grad: 1.59e-01 flops: 3.20e+14 wps: 3.71e+04 iter: 1.529 data: 0.0889 lr: 7.11e-05 mem: 54% pow: 442.708 W 0: INFO 26-04-29 02:12:25.492259 - 0:54:54 - step: 2220 acc: 0 loss: 1.6199 grad: 1.61e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6189 data: 0.0687 lr: 7.11e-05 mem: 47% pow: 652.875 W 0: INFO 26-04-29 02:12:39.580260 - 0:55:08 - step: 2230 acc: 0 loss: 1.506 grad: 1.51e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6756 data: 0.0028 lr: 7.11e-05 mem: 47% pow: 655.284 W 0: INFO 26-04-29 02:12:53.534528 - 0:55:22 - step: 2240 acc: 0 loss: 1.7968 grad: 1.61e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6117 data: 0.0723 lr: 7.11e-05 mem: 47% pow: 652.467 W 0: INFO 26-04-29 02:13:07.072585 - 0:55:35 - step: 2250 acc: 0 loss: 1.4219 grad: 1.64e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6287 data: 0.0623 lr: 7.11e-05 mem: 47% pow: 653.77 W 0: INFO 26-04-29 02:13:23.105628 - 0:55:51 - step: 2260 acc: 0 loss: 1.6307 grad: 1.55e-01 flops: 3.52e+14 wps: 4.09e+04 iter: 0.9605 data: 0.0025 lr: 7.10e-05 mem: 47% pow: 489.094 W 0: INFO 26-04-29 02:13:36.879432 - 0:56:05 - step: 2270 acc: 0 loss: 1.8491 grad: 1.65e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6315 data: 0.0649 lr: 7.10e-05 mem: 47% pow: 642.783 W 0: INFO 26-04-29 02:13:50.306427 - 0:56:18 - step: 2280 acc: 0 loss: 1.6802 grad: 1.50e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.611 data: 0.0668 lr: 7.10e-05 mem: 47% pow: 664.015 W 0: INFO 26-04-29 02:14:06.182602 - 0:56:34 - step: 2290 acc: 0 loss: 1.3861 grad: 1.46e-01 flops: 3.56e+14 wps: 4.13e+04 iter: 0.6295 data: 0.0708 lr: 7.10e-05 mem: 47% pow: 642.357 W 0: INFO 26-04-29 02:14:19.874325 - 0:56:48 - step: 2300 acc: 0 loss: 1.4777 grad: 1.54e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6141 data: 0.0703 lr: 7.10e-05 mem: 47% pow: 652.998 W 0: INFO 26-04-29 02:14:36.544960 - 0:57:05 - step: 2310 acc: 0 loss: 1.6223 grad: 1.58e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.598 data: 0.0763 lr: 7.10e-05 mem: 54% pow: 657.106 W 0: INFO 26-04-29 02:14:50.858252 - 0:57:19 - step: 2320 acc: 0 loss: 1.4911 grad: 1.52e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.5866 data: 0.0833 lr: 7.09e-05 mem: 47% pow: 664.128 W 0: INFO 26-04-29 02:15:04.446164 - 0:57:33 - step: 2330 acc: 0 loss: 1.4971 grad: 1.51e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6097 data: 0.0676 lr: 7.09e-05 mem: 47% pow: 672.219 W 0: INFO 26-04-29 02:15:17.885933 - 0:57:46 - step: 2340 acc: 0 loss: 1.6679 grad: 1.45e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6384 data: 0.065 lr: 7.09e-05 mem: 47% pow: 645.414 W 0: INFO 26-04-29 02:15:31.310423 - 0:57:59 - step: 2350 acc: 0 loss: 1.5891 grad: 1.51e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6238 data: 0.0649 lr: 7.09e-05 mem: 47% pow: 656.515 W 0: INFO 26-04-29 02:15:44.940105 - 0:58:13 - step: 2360 acc: 0 loss: 1.6214 grad: 1.47e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6236 data: 0.068 lr: 7.09e-05 mem: 47% pow: 653.573 W 0: INFO 26-04-29 02:16:04.347617 - 0:58:32 - step: 2370 acc: 0 loss: 1.8386 grad: 1.65e-01 flops: 2.91e+14 wps: 3.38e+04 iter: 0.7024 data: 0.0028 lr: 7.09e-05 mem: 47% pow: 637.416 W 0: INFO 26-04-29 02:16:18.143907 - 0:58:46 - step: 2380 acc: 0 loss: 1.6985 grad: 1.51e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.735 data: 0.0028 lr: 7.09e-05 mem: 47% pow: 622.134 W 0: INFO 26-04-29 02:16:31.788374 - 0:59:00 - step: 2390 acc: 0 loss: 1.6986 grad: 1.56e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6877 data: 0.0028 lr: 7.08e-05 mem: 47% pow: 660.342 W 0: INFO 26-04-29 02:16:45.308570 - 0:59:13 - step: 2400 acc: 0 loss: 1.8161 grad: 1.47e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6631 data: 0.0028 lr: 7.08e-05 mem: 47% pow: 662.853 W 0: INFO 26-04-29 02:17:01.813381 - 0:59:30 - step: 2410 acc: 0 loss: 1.5473 grad: 1.65e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.614 data: 0.0733 lr: 7.08e-05 mem: 54% pow: 654.27 W 0: INFO 26-04-29 02:17:15.517380 - 0:59:44 - step: 2420 acc: 0 loss: 1.6706 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6224 data: 0.0726 lr: 7.08e-05 mem: 47% pow: 641.9 W 0: INFO 26-04-29 02:17:29.174255 - 0:59:57 - step: 2430 acc: 0 loss: 1.9967 grad: 1.67e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6603 data: 0.0673 lr: 7.08e-05 mem: 47% pow: 631.537 W 0: INFO 26-04-29 02:17:42.722240 - 1:00:11 - step: 2440 acc: 0 loss: 1.3977 grad: 1.61e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6021 data: 0.0695 lr: 7.08e-05 mem: 47% pow: 656.101 W 0: INFO 26-04-29 02:17:56.126216 - 1:00:24 - step: 2450 acc: 0 loss: 1.241 grad: 1.57e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6106 data: 0.0717 lr: 7.08e-05 mem: 47% pow: 660.004 W 0: INFO 26-04-29 02:18:11.212617 - 1:00:39 - step: 2460 acc: 0 loss: 1.4094 grad: 1.47e-01 flops: 3.74e+14 wps: 4.34e+04 iter: 0.619 data: 0.0694 lr: 7.07e-05 mem: 47% pow: 648.772 W 0: INFO 26-04-29 02:18:24.628004 - 1:00:53 - step: 2470 acc: 0 loss: 1.3864 grad: 1.54e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6057 data: 0.0694 lr: 7.07e-05 mem: 47% pow: 660.993 W 0: INFO 26-04-29 02:18:38.115059 - 1:01:06 - step: 2480 acc: 0 loss: 1.4904 grad: 1.52e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6862 data: 0.0383 lr: 7.07e-05 mem: 47% pow: 629.728 W 0: INFO 26-04-29 02:18:53.624421 - 1:01:22 - step: 2490 acc: 0 loss: 1.2673 grad: 1.64e-01 flops: 3.64e+14 wps: 4.23e+04 iter: 0.6147 data: 0.0674 lr: 7.07e-05 mem: 47% pow: 652.211 W 0: INFO 26-04-29 02:19:07.035648 - 1:01:35 - step: 2500 acc: 0 loss: 1.5223 grad: 1.71e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6347 data: 0.0663 lr: 7.07e-05 mem: 47% pow: 644.538 W 0: INFO 26-04-29 02:19:23.350131 - 1:01:51 - step: 2510 acc: 0 loss: 1.4654 grad: 1.52e-01 flops: 3.46e+14 wps: 4.02e+04 iter: 0.6203 data: 0.0673 lr: 7.07e-05 mem: 54% pow: 654.173 W 0: INFO 26-04-29 02:19:36.773637 - 1:02:05 - step: 2520 acc: 0 loss: 1.4804 grad: 1.58e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6195 data: 0.0695 lr: 7.07e-05 mem: 47% pow: 655.152 W 0: INFO 26-04-29 02:19:50.282548 - 1:02:18 - step: 2530 acc: 0 loss: 1.2918 grad: 1.59e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6218 data: 0.0691 lr: 7.06e-05 mem: 47% pow: 652.727 W 0: INFO 26-04-29 02:20:03.864680 - 1:02:32 - step: 2540 acc: 0 loss: 1.4752 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6203 data: 0.0692 lr: 7.06e-05 mem: 47% pow: 655.293 W 0: INFO 26-04-29 02:20:17.788979 - 1:02:46 - step: 2550 acc: 0 loss: 1.7706 grad: 1.74e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6297 data: 0.0669 lr: 7.06e-05 mem: 47% pow: 645.715 W 0: INFO 26-04-29 02:20:31.222755 - 1:02:59 - step: 2560 acc: 0 loss: 1.6698 grad: 1.60e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6065 data: 0.0741 lr: 7.06e-05 mem: 47% pow: 657.537 W 0: INFO 26-04-29 02:20:45.000228 - 1:03:13 - step: 2570 acc: 0 loss: 1.4661 grad: 1.63e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.7454 data: 0.0724 lr: 7.06e-05 mem: 47% pow: 577.723 W 0: INFO 26-04-29 02:20:58.606791 - 1:03:27 - step: 2580 acc: 0 loss: 1.4701 grad: 1.59e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6056 data: 0.0751 lr: 7.06e-05 mem: 47% pow: 650.795 W 0: INFO 26-04-29 02:21:11.963836 - 1:03:40 - step: 2590 acc: 0 loss: 1.5061 grad: 1.58e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.6108 data: 0.0719 lr: 7.05e-05 mem: 47% pow: 651.158 W 0: INFO 26-04-29 02:21:25.496929 - 1:03:54 - step: 2600 acc: 0 loss: 1.4621 grad: 1.64e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5966 data: 0.0753 lr: 7.05e-05 mem: 47% pow: 658.461 W 0: INFO 26-04-29 02:21:42.025801 - 1:04:10 - step: 2610 acc: 0 loss: 1.2133 grad: 1.69e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6031 data: 0.0729 lr: 7.05e-05 mem: 54% pow: 655.83 W 0: INFO 26-04-29 02:21:55.746975 - 1:04:24 - step: 2620 acc: 0 loss: 1.8467 grad: 1.62e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6854 data: 0.07 lr: 7.05e-05 mem: 47% pow: 604.877 W 0: INFO 26-04-29 02:22:09.237006 - 1:04:37 - step: 2630 acc: 0 loss: 1.3058 grad: 1.66e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6307 data: 0.0628 lr: 7.05e-05 mem: 47% pow: 653.257 W 0: INFO 26-04-29 02:22:22.685029 - 1:04:51 - step: 2640 acc: 0 loss: 1.5911 grad: 1.83e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6085 data: 0.073 lr: 7.05e-05 mem: 47% pow: 655.883 W 0: INFO 26-04-29 02:22:36.299988 - 1:05:04 - step: 2650 acc: 0 loss: 1.3464 grad: 1.55e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.65 data: 0.0679 lr: 7.05e-05 mem: 47% pow: 633.19 W 0: INFO 26-04-29 02:22:50.007335 - 1:05:18 - step: 2660 acc: 0 loss: 1.5838 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6349 data: 0.0694 lr: 7.04e-05 mem: 47% pow: 649.528 W 0: INFO 26-04-29 02:23:03.583686 - 1:05:32 - step: 2670 acc: 0 loss: 1.6693 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6045 data: 0.0769 lr: 7.04e-05 mem: 47% pow: 657.491 W 0: INFO 26-04-29 02:23:17.511250 - 1:05:46 - step: 2680 acc: 0 loss: 2.0592 grad: 1.65e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6056 data: 0.0698 lr: 7.04e-05 mem: 47% pow: 657.794 W 0: INFO 26-04-29 02:23:31.194927 - 1:05:59 - step: 2690 acc: 0 loss: 1.5803 grad: 1.51e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6083 data: 0.0722 lr: 7.04e-05 mem: 47% pow: 656.537 W 0: INFO 26-04-29 02:23:44.943312 - 1:06:13 - step: 2700 acc: 0 loss: 1.4295 grad: 1.81e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.626 data: 0.0631 lr: 7.04e-05 mem: 47% pow: 659.378 W 0: INFO 26-04-29 02:24:01.936512 - 1:06:30 - step: 2710 acc: 0 loss: 1.1341 grad: 1.60e-01 flops: 3.32e+14 wps: 3.86e+04 iter: 0.6005 data: 0.0691 lr: 7.04e-05 mem: 54% pow: 664.454 W 0: INFO 26-04-29 02:24:15.647682 - 1:06:44 - step: 2720 acc: 0 loss: 1.6466 grad: 1.58e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7269 data: 0.076 lr: 7.04e-05 mem: 47% pow: 597.206 W 0: INFO 26-04-29 02:24:29.311949 - 1:06:57 - step: 2730 acc: 0 loss: 1.8066 grad: 1.63e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6186 data: 0.071 lr: 7.03e-05 mem: 47% pow: 655.833 W 0: INFO 26-04-29 02:24:43.158873 - 1:07:11 - step: 2740 acc: 0 loss: 1.6431 grad: 1.54e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.63 data: 0.0661 lr: 7.03e-05 mem: 47% pow: 642.703 W 0: INFO 26-04-29 02:24:56.956474 - 1:07:25 - step: 2750 acc: 0 loss: 1.645 grad: 1.80e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6169 data: 0.0748 lr: 7.03e-05 mem: 47% pow: 647.287 W 0: INFO 26-04-29 02:25:10.774387 - 1:07:39 - step: 2760 acc: 0 loss: 1.1564 grad: 1.66e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6242 data: 0.0636 lr: 7.03e-05 mem: 47% pow: 662.392 W 0: INFO 26-04-29 02:25:24.520733 - 1:07:53 - step: 2770 acc: 0 loss: 1.5269 grad: 1.64e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6524 data: 0.0703 lr: 7.03e-05 mem: 47% pow: 624.548 W 0: INFO 26-04-29 02:25:38.124861 - 1:08:06 - step: 2780 acc: 0 loss: 1.5621 grad: 1.70e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6097 data: 0.0681 lr: 7.03e-05 mem: 47% pow: 657.712 W 0: INFO 26-04-29 02:25:51.896916 - 1:08:20 - step: 2790 acc: 0 loss: 1.5508 grad: 1.60e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6165 data: 0.0694 lr: 7.02e-05 mem: 47% pow: 658.736 W 0: INFO 26-04-29 02:26:05.772767 - 1:08:34 - step: 2800 acc: 0 loss: 1.2812 grad: 1.63e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6182 data: 0.0704 lr: 7.02e-05 mem: 47% pow: 651.077 W 0: INFO 26-04-29 02:26:22.269313 - 1:08:50 - step: 2810 acc: 0 loss: 1.6918 grad: 1.78e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6356 data: 0.0719 lr: 7.02e-05 mem: 54% pow: 644.899 W 0: INFO 26-04-29 02:26:35.977224 - 1:09:04 - step: 2820 acc: 0 loss: 1.4098 grad: 1.64e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6227 data: 0.0654 lr: 7.02e-05 mem: 47% pow: 653.359 W 0: INFO 26-04-29 02:26:49.802547 - 1:09:18 - step: 2830 acc: 0 loss: 1.3665 grad: 1.62e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6485 data: 0.0713 lr: 7.02e-05 mem: 47% pow: 629.48 W 0: INFO 26-04-29 02:27:03.621899 - 1:09:32 - step: 2840 acc: 0 loss: 1.5616 grad: 1.70e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.611 data: 0.066 lr: 7.02e-05 mem: 47% pow: 654.118 W 0: INFO 26-04-29 02:27:17.227092 - 1:09:45 - step: 2850 acc: 0 loss: 1.6541 grad: 1.84e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6104 data: 0.0707 lr: 7.02e-05 mem: 47% pow: 652.626 W 0: INFO 26-04-29 02:27:31.314297 - 1:09:59 - step: 2860 acc: 0 loss: 1.45 grad: 1.71e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5839 data: 0.0815 lr: 7.01e-05 mem: 47% pow: 661.628 W 0: INFO 26-04-29 02:27:45.018076 - 1:10:13 - step: 2870 acc: 0 loss: 1.4669 grad: 1.83e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6278 data: 0.0624 lr: 7.01e-05 mem: 47% pow: 656.943 W 0: INFO 26-04-29 02:27:58.666272 - 1:10:27 - step: 2880 acc: 0 loss: 1.6077 grad: 1.71e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6191 data: 0.0756 lr: 7.01e-05 mem: 47% pow: 649.983 W 0: INFO 26-04-29 02:28:12.615716 - 1:10:41 - step: 2890 acc: 0 loss: 1.2668 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.7962 data: 0.0717 lr: 7.01e-05 mem: 47% pow: 554.518 W 0: INFO 26-04-29 02:28:26.494616 - 1:10:55 - step: 2900 acc: 0 loss: 1.3882 grad: 2.26e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6407 data: 0.0722 lr: 7.01e-05 mem: 47% pow: 639.814 W 0: INFO 26-04-29 02:28:42.947604 - 1:11:11 - step: 2910 acc: 0 loss: 1.42 grad: 1.86e-01 flops: 3.43e+14 wps: 3.99e+04 iter: 0.6084 data: 0.0723 lr: 7.01e-05 mem: 54% pow: 647.677 W 0: INFO 26-04-29 02:28:56.647998 - 1:11:25 - step: 2920 acc: 0 loss: 1.9805 grad: 1.91e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6125 data: 0.0707 lr: 7.01e-05 mem: 47% pow: 656.943 W 0: INFO 26-04-29 02:29:10.410530 - 1:11:38 - step: 2930 acc: 0 loss: 1.4412 grad: 1.58e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.606 data: 0.0786 lr: 7.00e-05 mem: 47% pow: 652.176 W 0: INFO 26-04-29 02:29:24.164123 - 1:11:52 - step: 2940 acc: 0 loss: 1.3496 grad: 1.61e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6152 data: 0.0651 lr: 7.00e-05 mem: 47% pow: 659.564 W 0: INFO 26-04-29 02:29:37.599694 - 1:12:06 - step: 2950 acc: 0 loss: 1.6778 grad: 1.63e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6202 data: 0.0667 lr: 7.00e-05 mem: 47% pow: 653.47 W 0: INFO 26-04-29 02:29:51.182381 - 1:12:19 - step: 2960 acc: 0 loss: 1.3861 grad: 1.55e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.63 data: 0.0708 lr: 7.00e-05 mem: 47% pow: 641.975 W 0: INFO 26-04-29 02:30:05.096216 - 1:12:33 - step: 2970 acc: 0 loss: 1.2408 grad: 1.71e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7015 data: 0.0028 lr: 7.00e-05 mem: 47% pow: 646.722 W 0: INFO 26-04-29 02:30:18.665704 - 1:12:47 - step: 2980 acc: 0 loss: 1.6627 grad: 2.17e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6247 data: 0.0708 lr: 7.00e-05 mem: 47% pow: 644.318 W 0: INFO 26-04-29 02:30:32.371180 - 1:13:00 - step: 2990 acc: 0 loss: 1.8513 grad: 1.67e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5973 data: 0.0883 lr: 7.00e-05 mem: 47% pow: 657.304 W 0: INFO 26-04-29 02:30:46.350613 - 1:13:14 - step: 3000 acc: 0 loss: 1.1793 grad: 1.59e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7154 data: 0.0688 lr: 6.99e-05 mem: 47% pow: 606.645 W 0: INFO 26-04-29 02:30:49.959539 - 1:13:18 - garbage collection 0: INFO 26-04-29 02:31:04.182797 - 1:13:32 - step: 3010 acc: 0 loss: 1.7471 grad: 2.29e-01 flops: 3.17e+14 wps: 3.68e+04 iter: 0.6167 data: 0.0644 lr: 6.99e-05 mem: 54% pow: 650.837 W 0: INFO 26-04-29 02:31:17.614225 - 1:13:46 - step: 3020 acc: 0 loss: 1.1712 grad: 4.21e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6217 data: 0.0703 lr: 6.99e-05 mem: 47% pow: 649.416 W 0: INFO 26-04-29 02:31:31.029677 - 1:13:59 - step: 3030 acc: 0 loss: 1.4315 grad: 1.61e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6234 data: 0.0736 lr: 6.99e-05 mem: 47% pow: 647.173 W 0: INFO 26-04-29 02:31:44.569078 - 1:14:13 - step: 3040 acc: 0 loss: 1.3889 grad: 2.31e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6305 data: 0.0609 lr: 6.99e-05 mem: 47% pow: 650.055 W 0: INFO 26-04-29 02:31:58.281905 - 1:14:26 - step: 3050 acc: 0 loss: 1.0896 grad: 2.10e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6462 data: 0.0664 lr: 6.99e-05 mem: 47% pow: 641.737 W 0: INFO 26-04-29 02:32:12.168920 - 1:14:40 - step: 3060 acc: 0 loss: 1.5978 grad: 1.58e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6019 data: 0.0776 lr: 6.98e-05 mem: 47% pow: 663.694 W 0: INFO 26-04-29 02:32:25.819012 - 1:14:54 - step: 3070 acc: 0 loss: 1.5986 grad: 1.71e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6177 data: 0.0738 lr: 6.98e-05 mem: 47% pow: 651.504 W 0: INFO 26-04-29 02:32:39.755346 - 1:15:08 - step: 3080 acc: 0 loss: 1.8491 grad: 1.88e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6424 data: 0.068 lr: 6.98e-05 mem: 47% pow: 638.892 W 0: INFO 26-04-29 02:32:53.359442 - 1:15:21 - step: 3090 acc: 0 loss: 1.8445 grad: 1.68e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6108 data: 0.0667 lr: 6.98e-05 mem: 47% pow: 659.851 W 0: INFO 26-04-29 02:33:07.005884 - 1:15:35 - step: 3100 acc: 0 loss: 1.3877 grad: 1.66e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6231 data: 0.0726 lr: 6.98e-05 mem: 47% pow: 649.763 W 0: INFO 26-04-29 02:33:23.434322 - 1:15:52 - step: 3110 acc: 0 loss: 1.6496 grad: 1.56e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.6235 data: 0.0637 lr: 6.98e-05 mem: 54% pow: 659.152 W 0: INFO 26-04-29 02:33:37.166131 - 1:16:05 - step: 3120 acc: 0 loss: 1.3614 grad: 1.70e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6295 data: 0.0699 lr: 6.98e-05 mem: 47% pow: 642.558 W 0: INFO 26-04-29 02:33:50.805738 - 1:16:19 - step: 3130 acc: 0 loss: 1.5987 grad: 1.85e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.634 data: 0.0788 lr: 6.97e-05 mem: 47% pow: 656.314 W 0: INFO 26-04-29 02:34:04.485686 - 1:16:33 - step: 3140 acc: 0 loss: 1.5604 grad: 1.62e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6144 data: 0.0692 lr: 6.97e-05 mem: 47% pow: 650.254 W 0: INFO 26-04-29 02:34:18.194328 - 1:16:46 - step: 3150 acc: 0 loss: 1.6924 grad: 1.67e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6089 data: 0.0779 lr: 6.97e-05 mem: 47% pow: 650.397 W 0: INFO 26-04-29 02:34:31.867847 - 1:17:00 - step: 3160 acc: 0 loss: 1.671 grad: 2.22e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.682 data: 0.0379 lr: 6.97e-05 mem: 47% pow: 633.01 W 0: INFO 26-04-29 02:34:45.888426 - 1:17:14 - step: 3170 acc: 0 loss: 1.6567 grad: 1.73e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6232 data: 0.0735 lr: 6.97e-05 mem: 47% pow: 658.465 W 0: INFO 26-04-29 02:34:59.735506 - 1:17:28 - step: 3180 acc: 0 loss: 1.9635 grad: 1.62e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.604 data: 0.0713 lr: 6.97e-05 mem: 47% pow: 669.471 W 0: INFO 26-04-29 02:35:13.278012 - 1:17:41 - step: 3190 acc: 0 loss: 1.9406 grad: 1.58e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6289 data: 0.066 lr: 6.97e-05 mem: 47% pow: 647.37 W 0: INFO 26-04-29 02:35:27.220207 - 1:17:55 - step: 3200 acc: 0 loss: 1.7245 grad: 1.59e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7702 data: 0.061 lr: 6.96e-05 mem: 47% pow: 573.41 W 0: INFO 26-04-29 02:35:44.048199 - 1:18:12 - step: 3210 acc: 0 loss: 1.7588 grad: 1.56e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.616 data: 0.0707 lr: 6.96e-05 mem: 54% pow: 648.74 W 0: INFO 26-04-29 02:35:57.527584 - 1:18:26 - step: 3220 acc: 0 loss: 1.4487 grad: 1.69e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6227 data: 0.0698 lr: 6.96e-05 mem: 47% pow: 650.434 W 0: INFO 26-04-29 02:36:11.157305 - 1:18:39 - step: 3230 acc: 0 loss: 1.8187 grad: 1.66e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6884 data: 0.0673 lr: 6.96e-05 mem: 47% pow: 608.03 W 0: INFO 26-04-29 02:36:24.851098 - 1:18:53 - step: 3240 acc: 0 loss: 1.5526 grad: 1.66e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6733 data: 0.069 lr: 6.96e-05 mem: 47% pow: 616.329 W 0: INFO 26-04-29 02:36:38.700531 - 1:19:07 - step: 3250 acc: 0 loss: 1.6201 grad: 1.57e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.633 data: 0.0636 lr: 6.96e-05 mem: 47% pow: 641.533 W 0: INFO 26-04-29 02:36:52.192826 - 1:19:20 - step: 3260 acc: 0 loss: 1.9103 grad: 1.66e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6287 data: 0.0714 lr: 6.96e-05 mem: 47% pow: 638.307 W 0: INFO 26-04-29 02:37:06.116314 - 1:19:34 - step: 3270 acc: 0 loss: 1.864 grad: 1.83e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6073 data: 0.0653 lr: 6.95e-05 mem: 47% pow: 667.133 W 0: INFO 26-04-29 02:37:19.692058 - 1:19:48 - step: 3280 acc: 0 loss: 1.7193 grad: 1.76e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6177 data: 0.0713 lr: 6.95e-05 mem: 47% pow: 645.851 W 0: INFO 26-04-29 02:37:33.288106 - 1:20:01 - step: 3290 acc: 0 loss: 1.6773 grad: 1.67e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6118 data: 0.0648 lr: 6.95e-05 mem: 47% pow: 654.599 W 0: INFO 26-04-29 02:37:49.074288 - 1:20:17 - step: 3300 acc: 0 loss: 1.665 grad: 1.68e-01 flops: 3.58e+14 wps: 4.15e+04 iter: 0.6172 data: 0.073 lr: 6.95e-05 mem: 47% pow: 655.503 W 0: INFO 26-04-29 02:38:05.649006 - 1:20:34 - step: 3310 acc: 0 loss: 1.3595 grad: 1.67e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6061 data: 0.071 lr: 6.95e-05 mem: 54% pow: 649.449 W 0: INFO 26-04-29 02:38:19.365807 - 1:20:47 - step: 3320 acc: 0 loss: 1.4665 grad: 1.90e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6203 data: 0.0796 lr: 6.95e-05 mem: 47% pow: 655.951 W 0: INFO 26-04-29 02:38:35.653904 - 1:21:04 - step: 3330 acc: 0 loss: 1.6575 grad: 1.62e-01 flops: 3.47e+14 wps: 4.02e+04 iter: 0.6443 data: 0.074 lr: 6.94e-05 mem: 47% pow: 646.807 W 0: INFO 26-04-29 02:38:49.565338 - 1:21:18 - step: 3340 acc: 0 loss: 1.7922 grad: 1.60e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6191 data: 0.0638 lr: 6.94e-05 mem: 47% pow: 651.828 W 0: INFO 26-04-29 02:39:03.331123 - 1:21:31 - step: 3350 acc: 0 loss: 1.5281 grad: 1.64e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.7134 data: 0.0743 lr: 6.94e-05 mem: 47% pow: 604.958 W 0: INFO 26-04-29 02:39:17.085681 - 1:21:45 - step: 3360 acc: 0 loss: 1.4573 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7347 data: 0.0688 lr: 6.94e-05 mem: 47% pow: 583.607 W 0: INFO 26-04-29 02:39:30.508439 - 1:21:59 - step: 3370 acc: 0 loss: 1.67 grad: 1.68e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6284 data: 0.0648 lr: 6.94e-05 mem: 47% pow: 658.089 W 0: INFO 26-04-29 02:39:44.247361 - 1:22:12 - step: 3380 acc: 0 loss: 1.5881 grad: 1.80e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6871 data: 0.0702 lr: 6.94e-05 mem: 47% pow: 609.527 W 0: INFO 26-04-29 02:39:57.904166 - 1:22:26 - step: 3390 acc: 0 loss: 1.5526 grad: 1.97e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6599 data: 0.0619 lr: 6.94e-05 mem: 47% pow: 629.331 W 0: INFO 26-04-29 02:40:11.596047 - 1:22:40 - step: 3400 acc: 0 loss: 1.8987 grad: 1.85e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.7785 data: 0.0706 lr: 6.93e-05 mem: 47% pow: 564.003 W 0: INFO 26-04-29 02:40:28.385866 - 1:22:56 - step: 3410 acc: 0 loss: 1.7602 grad: 1.66e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6399 data: 0.0618 lr: 6.93e-05 mem: 54% pow: 648.613 W 0: INFO 26-04-29 02:40:42.406156 - 1:23:10 - step: 3420 acc: 0 loss: 1.7142 grad: 1.63e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6715 data: 0.0533 lr: 6.93e-05 mem: 47% pow: 625.035 W 0: INFO 26-04-29 02:40:56.299443 - 1:23:24 - step: 3430 acc: 0 loss: 1.4812 grad: 1.72e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6254 data: 0.0648 lr: 6.93e-05 mem: 47% pow: 652.984 W 0: INFO 26-04-29 02:41:10.049296 - 1:23:38 - step: 3440 acc: 0 loss: 1.7607 grad: 2.10e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6192 data: 0.0674 lr: 6.93e-05 mem: 47% pow: 650.7 W 0: INFO 26-04-29 02:41:23.591622 - 1:23:52 - step: 3450 acc: 0 loss: 1.4903 grad: 1.64e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6119 data: 0.0694 lr: 6.93e-05 mem: 47% pow: 653.05 W 0: INFO 26-04-29 02:41:37.209787 - 1:24:05 - step: 3460 acc: 0 loss: 1.8318 grad: 1.84e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6432 data: 0.0517 lr: 6.93e-05 mem: 47% pow: 666.011 W 0: INFO 26-04-29 02:41:50.826053 - 1:24:19 - step: 3470 acc: 0 loss: 1.5432 grad: 1.66e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6247 data: 0.0684 lr: 6.92e-05 mem: 47% pow: 647.448 W 0: INFO 26-04-29 02:42:04.619458 - 1:24:33 - step: 3480 acc: 0 loss: 1.7045 grad: 1.56e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6207 data: 0.077 lr: 6.92e-05 mem: 47% pow: 642.936 W 0: INFO 26-04-29 02:42:18.164683 - 1:24:46 - step: 3490 acc: 0 loss: 1.8293 grad: 1.64e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6904 data: 0.0026 lr: 6.92e-05 mem: 47% pow: 659.258 W 0: INFO 26-04-29 02:42:31.767398 - 1:25:00 - step: 3500 acc: 0 loss: 1.2814 grad: 1.70e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6264 data: 0.0678 lr: 6.92e-05 mem: 47% pow: 652.209 W 0: INFO 26-04-29 02:42:48.212280 - 1:25:16 - step: 3510 acc: 0 loss: 1.6372 grad: 1.67e-01 flops: 3.43e+14 wps: 3.99e+04 iter: 0.6225 data: 0.0675 lr: 6.92e-05 mem: 54% pow: 651.393 W 0: INFO 26-04-29 02:43:01.962858 - 1:25:30 - step: 3520 acc: 0 loss: 1.7345 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.618 data: 0.0701 lr: 6.92e-05 mem: 47% pow: 657.717 W 0: INFO 26-04-29 02:43:15.403219 - 1:25:43 - step: 3530 acc: 0 loss: 1.8938 grad: 1.76e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6262 data: 0.0559 lr: 6.91e-05 mem: 47% pow: 649.331 W 0: INFO 26-04-29 02:43:28.839489 - 1:25:57 - step: 3540 acc: 0 loss: 1.4251 grad: 1.59e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6281 data: 0.0688 lr: 6.91e-05 mem: 47% pow: 639.741 W 0: INFO 26-04-29 02:43:42.823184 - 1:26:11 - step: 3550 acc: 0 loss: 1.4098 grad: 1.67e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6188 data: 0.0752 lr: 6.91e-05 mem: 47% pow: 646.526 W 0: INFO 26-04-29 02:43:56.247249 - 1:26:24 - step: 3560 acc: 0 loss: 2.0715 grad: 1.60e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6155 data: 0.0664 lr: 6.91e-05 mem: 47% pow: 643.985 W 0: INFO 26-04-29 02:44:10.015683 - 1:26:38 - step: 3570 acc: 0 loss: 1.6825 grad: 1.72e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6382 data: 0.063 lr: 6.91e-05 mem: 47% pow: 644.867 W 0: INFO 26-04-29 02:44:23.690088 - 1:26:52 - step: 3580 acc: 0 loss: 1.6582 grad: 1.62e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.673 data: 0.0447 lr: 6.91e-05 mem: 47% pow: 630.433 W 0: INFO 26-04-29 02:44:37.724672 - 1:27:06 - step: 3590 acc: 0 loss: 1.4892 grad: 1.63e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6971 data: 0.0661 lr: 6.91e-05 mem: 47% pow: 608.927 W 0: INFO 26-04-29 02:44:51.503292 - 1:27:20 - step: 3600 acc: 0 loss: 1.6258 grad: 1.54e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6474 data: 0.0692 lr: 6.90e-05 mem: 47% pow: 632.226 W 0: INFO 26-04-29 02:45:08.139240 - 1:27:36 - step: 3610 acc: 0 loss: 1.4365 grad: 1.59e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6064 data: 0.0681 lr: 6.90e-05 mem: 54% pow: 655.369 W 0: INFO 26-04-29 02:45:21.855193 - 1:27:50 - step: 3620 acc: 0 loss: 1.5239 grad: 1.46e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6042 data: 0.067 lr: 6.90e-05 mem: 47% pow: 668.364 W 0: INFO 26-04-29 02:45:35.500352 - 1:28:04 - step: 3630 acc: 0 loss: 1.8021 grad: 1.63e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6885 data: 0.0698 lr: 6.90e-05 mem: 47% pow: 605.641 W 0: INFO 26-04-29 02:45:49.302755 - 1:28:17 - step: 3640 acc: 0 loss: 1.8286 grad: 1.66e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6252 data: 0.0669 lr: 6.90e-05 mem: 47% pow: 649.002 W 0: INFO 26-04-29 02:46:02.849066 - 1:28:31 - step: 3650 acc: 0 loss: 1.8164 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6081 data: 0.0675 lr: 6.90e-05 mem: 47% pow: 664.335 W 0: INFO 26-04-29 02:46:16.514504 - 1:28:45 - step: 3660 acc: 0 loss: 1.355 grad: 1.49e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6002 data: 0.0691 lr: 6.90e-05 mem: 47% pow: 667.97 W 0: INFO 26-04-29 02:46:30.259152 - 1:28:58 - step: 3670 acc: 0 loss: 1.3388 grad: 1.61e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6361 data: 0.068 lr: 6.89e-05 mem: 47% pow: 637.457 W 0: INFO 26-04-29 02:46:44.000421 - 1:29:12 - step: 3680 acc: 0 loss: 1.3453 grad: 1.69e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6087 data: 0.0701 lr: 6.89e-05 mem: 47% pow: 650.868 W 0: INFO 26-04-29 02:46:58.175401 - 1:29:26 - step: 3690 acc: 0 loss: 1.809 grad: 1.55e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6068 data: 0.0699 lr: 6.89e-05 mem: 47% pow: 654.03 W 0: INFO 26-04-29 02:47:11.845315 - 1:29:40 - step: 3700 acc: 0 loss: 1.4798 grad: 1.70e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.7205 data: 0.0618 lr: 6.89e-05 mem: 47% pow: 596.81 W 0: INFO 26-04-29 02:47:28.541244 - 1:29:57 - step: 3710 acc: 0 loss: 1.555 grad: 1.73e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.6714 data: 0.0624 lr: 6.89e-05 mem: 54% pow: 624.894 W 0: INFO 26-04-29 02:47:42.448014 - 1:30:11 - step: 3720 acc: 0 loss: 1.6995 grad: 1.66e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6392 data: 0.0657 lr: 6.89e-05 mem: 47% pow: 640.828 W 0: INFO 26-04-29 02:47:56.061229 - 1:30:24 - step: 3730 acc: 0 loss: 1.1423 grad: 1.63e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6134 data: 0.063 lr: 6.89e-05 mem: 47% pow: 656.997 W 0: INFO 26-04-29 02:48:09.903165 - 1:30:38 - step: 3740 acc: 0 loss: 2.3073 grad: 1.63e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6248 data: 0.0712 lr: 6.88e-05 mem: 47% pow: 644.899 W 0: INFO 26-04-29 02:48:23.625680 - 1:30:52 - step: 3750 acc: 0 loss: 1.4436 grad: 1.59e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6099 data: 0.0737 lr: 6.88e-05 mem: 47% pow: 652.672 W 0: INFO 26-04-29 02:48:37.384386 - 1:31:05 - step: 3760 acc: 0 loss: 1.5789 grad: 1.63e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6246 data: 0.0679 lr: 6.88e-05 mem: 47% pow: 652.928 W 0: INFO 26-04-29 02:48:51.001346 - 1:31:19 - step: 3770 acc: 0 loss: 1.5616 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6288 data: 0.0635 lr: 6.88e-05 mem: 47% pow: 653.15 W 0: INFO 26-04-29 02:49:04.761288 - 1:31:33 - step: 3780 acc: 0 loss: 1.3382 grad: 1.56e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.6026 data: 0.0739 lr: 6.88e-05 mem: 47% pow: 658.081 W 0: INFO 26-04-29 02:49:18.483567 - 1:31:47 - step: 3790 acc: 0 loss: 1.3505 grad: 1.65e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.63 data: 0.0699 lr: 6.88e-05 mem: 47% pow: 644.901 W 0: INFO 26-04-29 02:49:32.087113 - 1:32:00 - step: 3800 acc: 0 loss: 1.7981 grad: 1.67e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6357 data: 0.0696 lr: 6.87e-05 mem: 47% pow: 639.718 W 0: INFO 26-04-29 02:49:48.557249 - 1:32:17 - step: 3810 acc: 0 loss: 1.9577 grad: 1.54e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.6116 data: 0.0646 lr: 6.87e-05 mem: 54% pow: 654.715 W 0: INFO 26-04-29 02:50:02.381501 - 1:32:30 - step: 3820 acc: 0 loss: 1.4354 grad: 1.57e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6166 data: 0.0704 lr: 6.87e-05 mem: 47% pow: 664.511 W 0: INFO 26-04-29 02:50:16.017600 - 1:32:44 - step: 3830 acc: 0 loss: 1.2078 grad: 1.60e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6196 data: 0.0675 lr: 6.87e-05 mem: 47% pow: 654.0 W 0: INFO 26-04-29 02:50:29.456397 - 1:32:58 - step: 3840 acc: 0 loss: 1.3276 grad: 1.75e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6203 data: 0.0722 lr: 6.87e-05 mem: 47% pow: 660.176 W 0: INFO 26-04-29 02:50:43.068168 - 1:33:11 - step: 3850 acc: 0 loss: 1.9105 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6499 data: 0.0675 lr: 6.87e-05 mem: 47% pow: 634.02 W 0: INFO 26-04-29 02:50:56.738600 - 1:33:25 - step: 3860 acc: 0 loss: 1.5967 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6018 data: 0.0758 lr: 6.87e-05 mem: 47% pow: 655.245 W 0: INFO 26-04-29 02:51:10.507353 - 1:33:39 - step: 3870 acc: 0 loss: 1.8631 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6267 data: 0.0574 lr: 6.86e-05 mem: 47% pow: 652.711 W 0: INFO 26-04-29 02:51:24.130684 - 1:33:52 - step: 3880 acc: 0 loss: 1.6701 grad: 1.58e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.61 data: 0.0661 lr: 6.86e-05 mem: 47% pow: 659.835 W 0: INFO 26-04-29 02:51:37.636738 - 1:34:06 - step: 3890 acc: 0 loss: 1.3946 grad: 1.57e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6405 data: 0.067 lr: 6.86e-05 mem: 47% pow: 655.339 W 0: INFO 26-04-29 02:51:51.136165 - 1:34:19 - step: 3900 acc: 0 loss: 1.4813 grad: 1.54e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6564 data: 0.0498 lr: 6.86e-05 mem: 47% pow: 657.51 W 0: INFO 26-04-29 02:52:08.161312 - 1:34:36 - step: 3910 acc: 0 loss: 1.6271 grad: 1.65e-01 flops: 3.32e+14 wps: 3.85e+04 iter: 0.6332 data: 0.0667 lr: 6.86e-05 mem: 54% pow: 658.5 W 0: INFO 26-04-29 02:52:21.663293 - 1:34:50 - step: 3920 acc: 0 loss: 1.5961 grad: 1.56e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6042 data: 0.0736 lr: 6.86e-05 mem: 47% pow: 656.357 W 0: INFO 26-04-29 02:52:35.449011 - 1:35:04 - step: 3930 acc: 0 loss: 1.6216 grad: 1.48e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6129 data: 0.0723 lr: 6.86e-05 mem: 47% pow: 665.58 W 0: INFO 26-04-29 02:52:49.024867 - 1:35:17 - step: 3940 acc: 0 loss: 1.3103 grad: 1.52e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6087 data: 0.0658 lr: 6.85e-05 mem: 47% pow: 652.173 W 0: INFO 26-04-29 02:53:02.631315 - 1:35:31 - step: 3950 acc: 0 loss: 1.8256 grad: 1.73e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6469 data: 0.0719 lr: 6.85e-05 mem: 47% pow: 630.091 W 0: INFO 26-04-29 02:53:16.722176 - 1:35:45 - step: 3960 acc: 0 loss: 1.466 grad: 1.52e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6317 data: 0.0691 lr: 6.85e-05 mem: 47% pow: 638.517 W 0: INFO 26-04-29 02:53:30.228727 - 1:35:58 - step: 3970 acc: 0 loss: 1.7355 grad: 1.57e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6467 data: 0.0712 lr: 6.85e-05 mem: 47% pow: 626.278 W 0: INFO 26-04-29 02:53:43.966972 - 1:36:12 - step: 3980 acc: 0 loss: 1.8291 grad: 1.71e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6548 data: 0.0684 lr: 6.85e-05 mem: 47% pow: 636.098 W 0: INFO 26-04-29 02:53:58.082393 - 1:36:26 - step: 3990 acc: 0 loss: 1.8093 grad: 1.56e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6099 data: 0.0705 lr: 6.85e-05 mem: 47% pow: 650.928 W 0: INFO 26-04-29 02:54:11.797618 - 1:36:40 - step: 4000 acc: 0 loss: 1.4949 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6256 data: 0.0673 lr: 6.84e-05 mem: 47% pow: 668.66 W 0: INFO 26-04-29 02:54:15.464075 - 1:36:44 - garbage collection 0: INFO 26-04-29 02:54:29.944910 - 1:36:58 - step: 4010 acc: 0 loss: 1.7175 grad: 1.60e-01 flops: 3.11e+14 wps: 3.61e+04 iter: 0.6369 data: 0.0611 lr: 6.84e-05 mem: 54% pow: 635.34 W 0: INFO 26-04-29 02:54:43.633107 - 1:37:12 - step: 4020 acc: 0 loss: 1.5776 grad: 1.49e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5978 data: 0.0844 lr: 6.84e-05 mem: 47% pow: 653.808 W 0: INFO 26-04-29 02:54:57.201029 - 1:37:25 - step: 4030 acc: 0 loss: 1.896 grad: 1.76e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6166 data: 0.0736 lr: 6.84e-05 mem: 47% pow: 645.758 W 0: INFO 26-04-29 02:55:10.757256 - 1:37:39 - step: 4040 acc: 0 loss: 1.5517 grad: 1.72e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5882 data: 0.087 lr: 6.84e-05 mem: 47% pow: 672.089 W 0: INFO 26-04-29 02:55:24.255757 - 1:37:52 - step: 4050 acc: 0 loss: 1.6947 grad: 1.57e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6155 data: 0.066 lr: 6.84e-05 mem: 47% pow: 671.283 W 0: INFO 26-04-29 02:55:37.929904 - 1:38:06 - step: 4060 acc: 0 loss: 1.6407 grad: 1.53e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.607 data: 0.0727 lr: 6.84e-05 mem: 47% pow: 659.312 W 0: INFO 26-04-29 02:55:51.641102 - 1:38:20 - step: 4070 acc: 0 loss: 1.529 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6487 data: 0.0661 lr: 6.83e-05 mem: 47% pow: 644.826 W 0: INFO 26-04-29 02:56:05.409959 - 1:38:33 - step: 4080 acc: 0 loss: 1.7823 grad: 1.52e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6158 data: 0.0728 lr: 6.83e-05 mem: 47% pow: 660.825 W 0: INFO 26-04-29 02:56:19.364692 - 1:38:47 - step: 4090 acc: 0 loss: 1.4111 grad: 1.50e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6117 data: 0.0771 lr: 6.83e-05 mem: 47% pow: 662.82 W 0: INFO 26-04-29 02:56:33.144914 - 1:39:01 - step: 4100 acc: 0 loss: 1.5814 grad: 2.67e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.7652 data: 0.0721 lr: 6.83e-05 mem: 47% pow: 565.643 W 0: INFO 26-04-29 02:56:50.300732 - 1:39:18 - step: 4110 acc: 0 loss: 1.7081 grad: 1.75e-01 flops: 3.29e+14 wps: 3.82e+04 iter: 0.6673 data: 0.0028 lr: 6.83e-05 mem: 54% pow: 664.862 W 0: INFO 26-04-29 02:57:04.009112 - 1:39:32 - step: 4120 acc: 0 loss: 1.7493 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6344 data: 0.0632 lr: 6.83e-05 mem: 47% pow: 645.6 W 0: INFO 26-04-29 02:57:17.512802 - 1:39:46 - step: 4130 acc: 0 loss: 1.2499 grad: 1.72e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5921 data: 0.0766 lr: 6.83e-05 mem: 47% pow: 667.258 W 0: INFO 26-04-29 02:57:31.242447 - 1:39:59 - step: 4140 acc: 0 loss: 1.5348 grad: 1.76e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6169 data: 0.0646 lr: 6.82e-05 mem: 47% pow: 659.123 W 0: INFO 26-04-29 02:57:44.759133 - 1:40:13 - step: 4150 acc: 0 loss: 1.3354 grad: 1.59e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6102 data: 0.0682 lr: 6.82e-05 mem: 47% pow: 658.393 W 0: INFO 26-04-29 02:57:58.442649 - 1:40:27 - step: 4160 acc: 0 loss: 1.4545 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6187 data: 0.0597 lr: 6.82e-05 mem: 47% pow: 653.291 W 0: INFO 26-04-29 02:58:12.022932 - 1:40:40 - step: 4170 acc: 0 loss: 1.194 grad: 1.84e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5934 data: 0.0837 lr: 6.82e-05 mem: 47% pow: 656.852 W 0: INFO 26-04-29 02:58:25.670862 - 1:40:54 - step: 4180 acc: 0 loss: 1.3149 grad: 1.63e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6077 data: 0.0698 lr: 6.82e-05 mem: 47% pow: 659.361 W 0: INFO 26-04-29 02:58:39.303862 - 1:41:07 - step: 4190 acc: 0 loss: 2.04 grad: 1.54e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.624 data: 0.0723 lr: 6.82e-05 mem: 47% pow: 646.381 W 0: INFO 26-04-29 02:58:52.768741 - 1:41:21 - step: 4200 acc: 0 loss: 1.5175 grad: 1.55e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6294 data: 0.0561 lr: 6.82e-05 mem: 47% pow: 656.809 W 0: INFO 26-04-29 02:59:10.219502 - 1:41:38 - step: 4210 acc: 0 loss: 1.7918 grad: 1.57e-01 flops: 3.24e+14 wps: 3.76e+04 iter: 0.6236 data: 0.0639 lr: 6.81e-05 mem: 54% pow: 652.126 W 0: INFO 26-04-29 02:59:23.869588 - 1:41:52 - step: 4220 acc: 0 loss: 1.6852 grad: 1.72e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6702 data: 0.0707 lr: 6.81e-05 mem: 47% pow: 614.605 W 0: INFO 26-04-29 02:59:37.968255 - 1:42:06 - step: 4230 acc: 0 loss: 1.793 grad: 1.76e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.715 data: 0.0675 lr: 6.81e-05 mem: 47% pow: 598.13 W 0: INFO 26-04-29 02:59:51.499195 - 1:42:20 - step: 4240 acc: 0 loss: 1.4179 grad: 1.63e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.629 data: 0.0672 lr: 6.81e-05 mem: 47% pow: 650.178 W 0: INFO 26-04-29 03:00:05.476279 - 1:42:34 - step: 4250 acc: 0 loss: 1.731 grad: 1.68e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6092 data: 0.0683 lr: 6.81e-05 mem: 47% pow: 661.047 W 0: INFO 26-04-29 03:00:19.163384 - 1:42:47 - step: 4260 acc: 0 loss: 1.8238 grad: 1.62e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6373 data: 0.0642 lr: 6.81e-05 mem: 47% pow: 642.531 W 0: INFO 26-04-29 03:00:33.081666 - 1:43:01 - step: 4270 acc: 0 loss: 1.3016 grad: 1.57e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6558 data: 0.0643 lr: 6.80e-05 mem: 47% pow: 631.373 W 0: INFO 26-04-29 03:00:46.763893 - 1:43:15 - step: 4280 acc: 0 loss: 1.3901 grad: 1.74e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6215 data: 0.0706 lr: 6.80e-05 mem: 47% pow: 654.96 W 0: INFO 26-04-29 03:01:00.461213 - 1:43:29 - step: 4290 acc: 0 loss: 1.8371 grad: 1.74e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6491 data: 0.0713 lr: 6.80e-05 mem: 47% pow: 625.84 W 0: INFO 26-04-29 03:01:14.164169 - 1:43:42 - step: 4300 acc: 0 loss: 1.7233 grad: 1.70e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6231 data: 0.0726 lr: 6.80e-05 mem: 47% pow: 642.076 W 0: INFO 26-04-29 03:01:30.865827 - 1:43:59 - step: 4310 acc: 0 loss: 1.42 grad: 1.79e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.7748 data: 0.0701 lr: 6.80e-05 mem: 54% pow: 565.432 W 0: INFO 26-04-29 03:01:45.244379 - 1:44:13 - step: 4320 acc: 0 loss: 1.6891 grad: 1.61e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.6581 data: 0.0719 lr: 6.80e-05 mem: 47% pow: 627.691 W 0: INFO 26-04-29 03:01:58.802548 - 1:44:27 - step: 4330 acc: 0 loss: 1.9326 grad: 1.62e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6328 data: 0.0676 lr: 6.80e-05 mem: 47% pow: 645.755 W 0: INFO 26-04-29 03:02:12.501600 - 1:44:41 - step: 4340 acc: 0 loss: 1.5434 grad: 1.59e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6128 data: 0.0666 lr: 6.79e-05 mem: 47% pow: 652.623 W 0: INFO 26-04-29 03:02:26.357384 - 1:44:54 - step: 4350 acc: 0 loss: 1.4104 grad: 1.72e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6145 data: 0.0728 lr: 6.79e-05 mem: 47% pow: 676.719 W 0: INFO 26-04-29 03:02:40.124715 - 1:45:08 - step: 4360 acc: 0 loss: 1.5305 grad: 1.84e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6327 data: 0.0674 lr: 6.79e-05 mem: 47% pow: 646.661 W 0: INFO 26-04-29 03:02:53.845434 - 1:45:22 - step: 4370 acc: 0 loss: 1.3182 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7137 data: 0.0672 lr: 6.79e-05 mem: 47% pow: 592.24 W 0: INFO 26-04-29 03:03:07.676693 - 1:45:36 - step: 4380 acc: 0 loss: 1.891 grad: 1.59e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6249 data: 0.0724 lr: 6.79e-05 mem: 47% pow: 646.045 W 0: INFO 26-04-29 03:03:21.545052 - 1:45:50 - step: 4390 acc: 0 loss: 1.4577 grad: 1.94e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6429 data: 0.0699 lr: 6.79e-05 mem: 47% pow: 636.854 W 0: INFO 26-04-29 03:03:35.179001 - 1:46:03 - step: 4400 acc: 0 loss: 1.7435 grad: 1.84e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6161 data: 0.064 lr: 6.79e-05 mem: 47% pow: 655.458 W 0: INFO 26-04-29 03:03:52.170483 - 1:46:20 - step: 4410 acc: 0 loss: 1.5524 grad: 1.74e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 1.0061 data: 0.0689 lr: 6.78e-05 mem: 54% pow: 438.953 W 0: INFO 26-04-29 03:04:05.716603 - 1:46:34 - step: 4420 acc: 0 loss: 1.4402 grad: 1.65e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6477 data: 0.051 lr: 6.78e-05 mem: 47% pow: 638.698 W 0: INFO 26-04-29 03:04:19.140809 - 1:46:47 - step: 4430 acc: 0 loss: 1.8078 grad: 1.94e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.606 data: 0.0758 lr: 6.78e-05 mem: 47% pow: 651.91 W 0: INFO 26-04-29 03:04:32.988193 - 1:47:01 - step: 4440 acc: 0 loss: 1.8016 grad: 1.63e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6097 data: 0.0732 lr: 6.78e-05 mem: 47% pow: 655.796 W 0: INFO 26-04-29 03:04:47.432568 - 1:47:16 - step: 4450 acc: 0 loss: 1.6837 grad: 2.04e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6271 data: 0.0619 lr: 6.78e-05 mem: 47% pow: 654.428 W 0: INFO 26-04-29 03:05:01.288084 - 1:47:29 - step: 4460 acc: 0 loss: 1.5953 grad: 1.62e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6266 data: 0.0627 lr: 6.78e-05 mem: 47% pow: 657.49 W 0: INFO 26-04-29 03:05:15.161790 - 1:47:43 - step: 4470 acc: 0 loss: 1.535 grad: 1.57e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6102 data: 0.0739 lr: 6.78e-05 mem: 47% pow: 654.29 W 0: INFO 26-04-29 03:05:28.693313 - 1:47:57 - step: 4480 acc: 0 loss: 1.8292 grad: 1.62e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6331 data: 0.068 lr: 6.77e-05 mem: 47% pow: 650.682 W 0: INFO 26-04-29 03:05:42.304348 - 1:48:10 - step: 4490 acc: 0 loss: 1.6098 grad: 1.81e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6302 data: 0.0386 lr: 6.77e-05 mem: 47% pow: 667.784 W 0: INFO 26-04-29 03:05:55.949252 - 1:48:24 - step: 4500 acc: 0 loss: 1.4214 grad: 1.69e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.636 data: 0.0756 lr: 6.77e-05 mem: 47% pow: 634.138 W 0: INFO 26-04-29 03:06:12.705044 - 1:48:41 - step: 4510 acc: 0 loss: 1.549 grad: 1.69e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6357 data: 0.0685 lr: 6.77e-05 mem: 54% pow: 660.85 W 0: INFO 26-04-29 03:06:26.389679 - 1:48:54 - step: 4520 acc: 0 loss: 1.5114 grad: 1.69e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6604 data: 0.0672 lr: 6.77e-05 mem: 47% pow: 647.17 W 0: INFO 26-04-29 03:06:40.146719 - 1:49:08 - step: 4530 acc: 0 loss: 1.6056 grad: 1.62e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.6849 data: 0.066 lr: 6.77e-05 mem: 47% pow: 617.225 W 0: INFO 26-04-29 03:06:53.865538 - 1:49:22 - step: 4540 acc: 0 loss: 1.4532 grad: 1.57e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.626 data: 0.0685 lr: 6.76e-05 mem: 47% pow: 643.644 W 0: INFO 26-04-29 03:07:07.524752 - 1:49:36 - step: 4550 acc: 0 loss: 1.8471 grad: 1.55e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6322 data: 0.069 lr: 6.76e-05 mem: 47% pow: 642.618 W 0: INFO 26-04-29 03:07:21.250159 - 1:49:49 - step: 4560 acc: 0 loss: 1.4729 grad: 1.57e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6261 data: 0.0684 lr: 6.76e-05 mem: 47% pow: 649.583 W 0: INFO 26-04-29 03:07:34.958545 - 1:50:03 - step: 4570 acc: 0 loss: 1.312 grad: 1.61e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6793 data: 0.0744 lr: 6.76e-05 mem: 47% pow: 607.474 W 0: INFO 26-04-29 03:07:48.533721 - 1:50:17 - step: 4580 acc: 0 loss: 1.37 grad: 1.87e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6399 data: 0.0566 lr: 6.76e-05 mem: 47% pow: 655.644 W 0: INFO 26-04-29 03:08:02.061013 - 1:50:30 - step: 4590 acc: 0 loss: 1.3668 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6083 data: 0.0642 lr: 6.76e-05 mem: 47% pow: 670.968 W 0: INFO 26-04-29 03:08:15.568151 - 1:50:44 - step: 4600 acc: 0 loss: 1.5282 grad: 1.64e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6018 data: 0.0719 lr: 6.76e-05 mem: 47% pow: 659.968 W 0: INFO 26-04-29 03:08:32.038847 - 1:51:00 - step: 4610 acc: 0 loss: 1.4709 grad: 1.82e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.611 data: 0.0713 lr: 6.75e-05 mem: 54% pow: 648.023 W 0: INFO 26-04-29 03:08:46.251171 - 1:51:14 - step: 4620 acc: 0 loss: 1.3467 grad: 1.66e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6335 data: 0.042 lr: 6.75e-05 mem: 47% pow: 661.009 W 0: INFO 26-04-29 03:08:59.893567 - 1:51:28 - step: 4630 acc: 0 loss: 1.7444 grad: 1.60e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6097 data: 0.0592 lr: 6.75e-05 mem: 47% pow: 663.15 W 0: INFO 26-04-29 03:09:13.655019 - 1:51:42 - step: 4640 acc: 0 loss: 1.7252 grad: 1.52e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7476 data: 0.0664 lr: 6.75e-05 mem: 47% pow: 579.66 W 0: INFO 26-04-29 03:09:27.085444 - 1:51:55 - step: 4650 acc: 0 loss: 1.6694 grad: 1.58e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6395 data: 0.0708 lr: 6.75e-05 mem: 47% pow: 645.859 W 0: INFO 26-04-29 03:09:40.661404 - 1:52:09 - step: 4660 acc: 0 loss: 1.5563 grad: 1.63e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.665 data: 0.0712 lr: 6.75e-05 mem: 47% pow: 620.296 W 0: INFO 26-04-29 03:09:54.538461 - 1:52:23 - step: 4670 acc: 0 loss: 1.7389 grad: 1.66e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6944 data: 0.0024 lr: 6.75e-05 mem: 47% pow: 635.944 W 0: INFO 26-04-29 03:10:08.117852 - 1:52:36 - step: 4680 acc: 0 loss: 1.4843 grad: 1.84e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6141 data: 0.0708 lr: 6.74e-05 mem: 47% pow: 649.103 W 0: INFO 26-04-29 03:10:21.636203 - 1:52:50 - step: 4690 acc: 0 loss: 1.5661 grad: 1.72e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6094 data: 0.0724 lr: 6.74e-05 mem: 47% pow: 656.939 W 0: INFO 26-04-29 03:10:34.994066 - 1:53:03 - step: 4700 acc: 0 loss: 1.6365 grad: 1.54e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.6235 data: 0.0739 lr: 6.74e-05 mem: 47% pow: 650.106 W 0: INFO 26-04-29 03:10:51.389278 - 1:53:19 - step: 4710 acc: 0 loss: 1.3645 grad: 1.78e-01 flops: 3.44e+14 wps: 4.00e+04 iter: 0.6334 data: 0.0423 lr: 6.74e-05 mem: 54% pow: 663.648 W 0: INFO 26-04-29 03:11:04.925129 - 1:53:33 - step: 4720 acc: 0 loss: 1.6146 grad: 1.60e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.625 data: 0.0659 lr: 6.74e-05 mem: 47% pow: 644.404 W 0: INFO 26-04-29 03:11:18.876321 - 1:53:47 - step: 4730 acc: 0 loss: 1.6216 grad: 1.65e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6192 data: 0.0754 lr: 6.74e-05 mem: 47% pow: 644.097 W 0: INFO 26-04-29 03:11:32.666913 - 1:54:01 - step: 4740 acc: 0 loss: 1.7873 grad: 1.52e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6208 data: 0.0708 lr: 6.73e-05 mem: 47% pow: 659.343 W 0: INFO 26-04-29 03:11:46.366345 - 1:54:14 - step: 4750 acc: 0 loss: 1.4691 grad: 1.61e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6137 data: 0.0693 lr: 6.73e-05 mem: 47% pow: 655.39 W 0: INFO 26-04-29 03:11:59.902226 - 1:54:28 - step: 4760 acc: 0 loss: 1.7903 grad: 1.58e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6084 data: 0.0738 lr: 6.73e-05 mem: 47% pow: 673.025 W 0: INFO 26-04-29 03:12:13.709809 - 1:54:42 - step: 4770 acc: 0 loss: 1.4813 grad: 1.53e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6042 data: 0.0694 lr: 6.73e-05 mem: 47% pow: 661.865 W 0: INFO 26-04-29 03:12:27.638210 - 1:54:56 - step: 4780 acc: 0 loss: 1.4363 grad: 1.63e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6326 data: 0.0676 lr: 6.73e-05 mem: 47% pow: 654.329 W 0: INFO 26-04-29 03:12:41.329372 - 1:55:09 - step: 4790 acc: 0 loss: 1.4915 grad: 1.63e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6663 data: 0.0697 lr: 6.73e-05 mem: 47% pow: 620.447 W 0: INFO 26-04-29 03:12:55.097083 - 1:55:23 - step: 4800 acc: 0 loss: 1.1904 grad: 1.58e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6034 data: 0.0694 lr: 6.73e-05 mem: 47% pow: 662.885 W 0: INFO 26-04-29 03:13:11.749516 - 1:55:40 - step: 4810 acc: 0 loss: 1.8059 grad: 1.66e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.611 data: 0.0786 lr: 6.72e-05 mem: 54% pow: 663.26 W 0: INFO 26-04-29 03:13:25.191680 - 1:55:53 - step: 4820 acc: 0 loss: 1.5867 grad: 1.54e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.586 data: 0.1059 lr: 6.72e-05 mem: 47% pow: 659.694 W 0: INFO 26-04-29 03:13:38.796970 - 1:56:07 - step: 4830 acc: 0 loss: 1.584 grad: 1.53e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6601 data: 0.063 lr: 6.72e-05 mem: 47% pow: 632.893 W 0: INFO 26-04-29 03:13:52.202254 - 1:56:20 - step: 4840 acc: 0 loss: 1.5085 grad: 1.59e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.6147 data: 0.0742 lr: 6.72e-05 mem: 47% pow: 647.529 W 0: INFO 26-04-29 03:14:05.941414 - 1:56:34 - step: 4850 acc: 0 loss: 1.737 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6285 data: 0.0593 lr: 6.72e-05 mem: 47% pow: 651.261 W 0: INFO 26-04-29 03:14:19.582937 - 1:56:48 - step: 4860 acc: 0 loss: 1.2813 grad: 1.59e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6051 data: 0.0653 lr: 6.72e-05 mem: 47% pow: 668.355 W 0: INFO 26-04-29 03:14:33.245475 - 1:57:01 - step: 4870 acc: 0 loss: 1.8001 grad: 1.53e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6404 data: 0.0664 lr: 6.72e-05 mem: 47% pow: 642.651 W 0: INFO 26-04-29 03:14:46.800557 - 1:57:15 - step: 4880 acc: 0 loss: 1.9144 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6107 data: 0.0746 lr: 6.71e-05 mem: 47% pow: 650.957 W 0: INFO 26-04-29 03:15:00.549857 - 1:57:29 - step: 4890 acc: 0 loss: 1.8389 grad: 1.81e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6076 data: 0.0641 lr: 6.71e-05 mem: 47% pow: 672.376 W 0: INFO 26-04-29 03:15:14.257503 - 1:57:42 - step: 4900 acc: 0 loss: 1.3574 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6538 data: 0.0418 lr: 6.71e-05 mem: 47% pow: 642.437 W 0: INFO 26-04-29 03:15:31.002488 - 1:57:59 - step: 4910 acc: 0 loss: 1.6544 grad: 1.54e-01 flops: 3.37e+14 wps: 3.92e+04 iter: 0.6174 data: 0.0638 lr: 6.71e-05 mem: 54% pow: 654.588 W 0: INFO 26-04-29 03:15:44.668977 - 1:58:13 - step: 4920 acc: 0 loss: 1.7239 grad: 1.55e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6906 data: 0.0857 lr: 6.71e-05 mem: 47% pow: 598.237 W 0: INFO 26-04-29 03:15:58.360494 - 1:58:26 - step: 4930 acc: 0 loss: 1.4969 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6015 data: 0.0725 lr: 6.71e-05 mem: 47% pow: 660.811 W 0: INFO 26-04-29 03:16:11.963768 - 1:58:40 - step: 4940 acc: 0 loss: 1.7253 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6137 data: 0.0675 lr: 6.71e-05 mem: 47% pow: 657.486 W 0: INFO 26-04-29 03:16:25.709792 - 1:58:54 - step: 4950 acc: 0 loss: 1.7999 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6059 data: 0.0721 lr: 6.70e-05 mem: 47% pow: 656.507 W 0: INFO 26-04-29 03:16:39.265287 - 1:59:07 - step: 4960 acc: 0 loss: 1.6927 grad: 1.54e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6346 data: 0.051 lr: 6.70e-05 mem: 47% pow: 659.328 W 0: INFO 26-04-29 03:16:52.747777 - 1:59:21 - step: 4970 acc: 0 loss: 1.5405 grad: 1.46e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5981 data: 0.0768 lr: 6.70e-05 mem: 47% pow: 653.776 W 0: INFO 26-04-29 03:17:06.361754 - 1:59:34 - step: 4980 acc: 0 loss: 1.7678 grad: 2.00e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6141 data: 0.0755 lr: 6.70e-05 mem: 47% pow: 651.238 W 0: INFO 26-04-29 03:17:20.002169 - 1:59:48 - step: 4990 acc: 0 loss: 1.3748 grad: 1.82e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6826 data: 0.0798 lr: 6.70e-05 mem: 47% pow: 617.736 W 0: INFO 26-04-29 03:17:33.672769 - 2:00:02 - step: 5000 acc: 0 loss: 2.045 grad: 1.62e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6026 data: 0.0708 lr: 6.70e-05 mem: 47% pow: 655.755 W 0: INFO 26-04-29 03:17:33.675349 - 2:00:02 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000005000 0: INFO 26-04-29 03:17:33.675705 - 2:00:02 - Saving... 0: INFO 26-04-29 03:17:39.734033 - 2:00:08 - State dict saved! 0: INFO 26-04-29 03:17:39.818562 - 2:00:08 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000005000/train_state_00000.json 0: INFO 26-04-29 03:17:39.821857 - 2:00:08 - Train state saved ! 0: INFO 26-04-29 03:17:39.822012 - 2:00:08 - Cleaning up checkpoints... 0: INFO 26-04-29 03:17:39.822140 - 2:00:08 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000005000')] 0: INFO 26-04-29 03:17:39.822233 - 2:00:08 - Eval folders: [] 0: INFO 26-04-29 03:17:39.822313 - 2:00:08 - Other folders: [] 0: INFO 26-04-29 03:17:39.822411 - 2:00:08 - Removing folders: set() 0: INFO 26-04-29 03:17:43.485677 - 2:00:12 - garbage collection 0: INFO 26-04-29 03:17:57.809119 - 2:00:26 - step: 5010 acc: 0 loss: 1.7145 grad: 1.65e-01 flops: 2.34e+14 wps: 2.72e+04 iter: 0.6212 data: 0.0756 lr: 6.69e-05 mem: 54% pow: 645.093 W 0: INFO 26-04-29 03:18:11.419133 - 2:00:40 - step: 5020 acc: 0 loss: 1.6645 grad: 1.70e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6106 data: 0.0777 lr: 6.69e-05 mem: 47% pow: 657.666 W 0: INFO 26-04-29 03:18:25.145317 - 2:00:53 - step: 5030 acc: 0 loss: 1.5512 grad: 1.57e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6538 data: 0.0599 lr: 6.69e-05 mem: 47% pow: 636.598 W 0: INFO 26-04-29 03:18:38.979750 - 2:01:07 - step: 5040 acc: 0 loss: 1.324 grad: 1.53e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6425 data: 0.069 lr: 6.69e-05 mem: 47% pow: 649.887 W 0: INFO 26-04-29 03:18:52.640155 - 2:01:21 - step: 5050 acc: 0 loss: 1.2374 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.627 data: 0.0727 lr: 6.69e-05 mem: 47% pow: 655.921 W 0: INFO 26-04-29 03:19:06.443157 - 2:01:35 - step: 5060 acc: 0 loss: 1.2707 grad: 1.44e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6165 data: 0.0678 lr: 6.69e-05 mem: 47% pow: 647.283 W 0: INFO 26-04-29 03:19:20.435798 - 2:01:49 - step: 5070 acc: 0 loss: 1.6636 grad: 1.55e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6142 data: 0.0645 lr: 6.69e-05 mem: 47% pow: 649.517 W 0: INFO 26-04-29 03:19:34.101650 - 2:02:02 - step: 5080 acc: 0 loss: 1.8412 grad: 1.55e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6167 data: 0.0722 lr: 6.68e-05 mem: 47% pow: 651.397 W 0: INFO 26-04-29 03:19:47.552885 - 2:02:16 - step: 5090 acc: 0 loss: 1.3645 grad: 1.51e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6162 data: 0.0657 lr: 6.68e-05 mem: 47% pow: 655.872 W 0: INFO 26-04-29 03:20:01.140252 - 2:02:29 - step: 5100 acc: 0 loss: 1.5215 grad: 1.58e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6599 data: 0.0692 lr: 6.68e-05 mem: 47% pow: 632.882 W 0: INFO 26-04-29 03:20:18.275667 - 2:02:46 - step: 5110 acc: 0 loss: 1.5806 grad: 1.55e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.6392 data: 0.0643 lr: 6.68e-05 mem: 54% pow: 653.623 W 0: INFO 26-04-29 03:20:31.937838 - 2:03:00 - step: 5120 acc: 0 loss: 1.5144 grad: 1.61e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6579 data: 0.0877 lr: 6.68e-05 mem: 47% pow: 620.923 W 0: INFO 26-04-29 03:20:45.892322 - 2:03:14 - step: 5130 acc: 0 loss: 1.5268 grad: 1.80e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.624 data: 0.0711 lr: 6.68e-05 mem: 47% pow: 654.172 W 0: INFO 26-04-29 03:20:59.672061 - 2:03:28 - step: 5140 acc: 0 loss: 1.4272 grad: 1.65e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6251 data: 0.0694 lr: 6.68e-05 mem: 47% pow: 644.824 W 0: INFO 26-04-29 03:21:13.363420 - 2:03:41 - step: 5150 acc: 0 loss: 1.5559 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6199 data: 0.0701 lr: 6.67e-05 mem: 47% pow: 665.614 W 0: INFO 26-04-29 03:21:27.122939 - 2:03:55 - step: 5160 acc: 0 loss: 1.6831 grad: 1.67e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6431 data: 0.0656 lr: 6.67e-05 mem: 47% pow: 649.652 W 0: INFO 26-04-29 03:21:41.131225 - 2:04:09 - step: 5170 acc: 0 loss: 1.4266 grad: 1.63e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5877 data: 0.0939 lr: 6.67e-05 mem: 47% pow: 652.814 W 0: INFO 26-04-29 03:21:54.560019 - 2:04:23 - step: 5180 acc: 0 loss: 1.4431 grad: 1.77e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6217 data: 0.068 lr: 6.67e-05 mem: 47% pow: 650.978 W 0: INFO 26-04-29 03:22:08.582179 - 2:04:37 - step: 5190 acc: 0 loss: 1.5206 grad: 1.67e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6365 data: 0.054 lr: 6.67e-05 mem: 47% pow: 656.519 W 0: INFO 26-04-29 03:22:22.206968 - 2:04:50 - step: 5200 acc: 0 loss: 1.8249 grad: 1.89e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6219 data: 0.0679 lr: 6.67e-05 mem: 47% pow: 671.564 W 0: INFO 26-04-29 03:22:38.801551 - 2:05:07 - step: 5210 acc: 0 loss: 1.3026 grad: 1.55e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6168 data: 0.0709 lr: 6.66e-05 mem: 54% pow: 654.627 W 0: INFO 26-04-29 03:22:52.153795 - 2:05:20 - step: 5220 acc: 0 loss: 1.8254 grad: 1.51e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.6267 data: 0.0739 lr: 6.66e-05 mem: 47% pow: 635.606 W 0: INFO 26-04-29 03:23:05.672610 - 2:05:34 - step: 5230 acc: 0 loss: 1.8692 grad: 1.74e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.73 data: 0.0249 lr: 6.66e-05 mem: 47% pow: 613.597 W 0: INFO 26-04-29 03:23:19.198997 - 2:05:47 - step: 5240 acc: 0 loss: 1.4804 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6084 data: 0.0688 lr: 6.66e-05 mem: 47% pow: 656.225 W 0: INFO 26-04-29 03:23:33.301351 - 2:06:01 - step: 5250 acc: 0 loss: 1.7284 grad: 1.61e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6474 data: 0.0534 lr: 6.66e-05 mem: 47% pow: 660.015 W 0: INFO 26-04-29 03:23:47.279675 - 2:06:15 - step: 5260 acc: 0 loss: 1.6145 grad: 1.77e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.618 data: 0.0703 lr: 6.66e-05 mem: 47% pow: 660.257 W 0: INFO 26-04-29 03:24:00.980944 - 2:06:29 - step: 5270 acc: 0 loss: 1.3501 grad: 1.65e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6198 data: 0.0703 lr: 6.66e-05 mem: 47% pow: 657.357 W 0: INFO 26-04-29 03:24:14.807615 - 2:06:43 - step: 5280 acc: 0 loss: 1.6442 grad: 1.62e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.641 data: 0.0682 lr: 6.65e-05 mem: 47% pow: 639.225 W 0: INFO 26-04-29 03:24:28.413216 - 2:06:56 - step: 5290 acc: 0 loss: 1.672 grad: 1.60e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6026 data: 0.0803 lr: 6.65e-05 mem: 47% pow: 652.733 W 0: INFO 26-04-29 03:24:42.133633 - 2:07:10 - step: 5300 acc: 0 loss: 1.4218 grad: 1.62e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7007 data: 0.0725 lr: 6.65e-05 mem: 47% pow: 608.353 W 0: INFO 26-04-29 03:24:58.608778 - 2:07:27 - step: 5310 acc: 0 loss: 1.3585 grad: 1.62e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.6077 data: 0.0688 lr: 6.65e-05 mem: 54% pow: 656.074 W 0: INFO 26-04-29 03:25:12.213737 - 2:07:40 - step: 5320 acc: 0 loss: 1.7933 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5885 data: 0.1159 lr: 6.65e-05 mem: 47% pow: 638.047 W 0: INFO 26-04-29 03:25:25.987442 - 2:07:54 - step: 5330 acc: 0 loss: 1.4529 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6089 data: 0.0688 lr: 6.65e-05 mem: 47% pow: 657.484 W 0: INFO 26-04-29 03:25:39.512610 - 2:08:08 - step: 5340 acc: 0 loss: 1.6288 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6166 data: 0.0748 lr: 6.65e-05 mem: 47% pow: 662.293 W 0: INFO 26-04-29 03:25:53.103991 - 2:08:21 - step: 5350 acc: 0 loss: 1.3721 grad: 1.72e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6065 data: 0.0782 lr: 6.64e-05 mem: 47% pow: 651.651 W 0: INFO 26-04-29 03:26:06.620226 - 2:08:35 - step: 5360 acc: 0 loss: 1.5216 grad: 1.52e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6194 data: 0.0704 lr: 6.64e-05 mem: 47% pow: 660.371 W 0: INFO 26-04-29 03:26:20.208952 - 2:08:48 - step: 5370 acc: 0 loss: 1.6089 grad: 1.59e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6246 data: 0.0745 lr: 6.64e-05 mem: 47% pow: 642.005 W 0: INFO 26-04-29 03:26:33.881680 - 2:09:02 - step: 5380 acc: 0 loss: 1.4473 grad: 1.47e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6677 data: 0.0632 lr: 6.64e-05 mem: 47% pow: 622.181 W 0: INFO 26-04-29 03:26:48.488537 - 2:09:17 - step: 5390 acc: 0 loss: 1.363 grad: 1.52e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6363 data: 0.0681 lr: 6.64e-05 mem: 47% pow: 648.419 W 0: INFO 26-04-29 03:27:02.361217 - 2:09:30 - step: 5400 acc: 0 loss: 1.4099 grad: 1.84e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6198 data: 0.069 lr: 6.64e-05 mem: 47% pow: 657.564 W 0: INFO 26-04-29 03:27:19.031816 - 2:09:47 - step: 5410 acc: 0 loss: 1.6572 grad: 1.64e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6249 data: 0.0714 lr: 6.64e-05 mem: 54% pow: 641.522 W 0: INFO 26-04-29 03:27:32.629196 - 2:10:01 - step: 5420 acc: 0 loss: 1.4374 grad: 1.79e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6143 data: 0.0711 lr: 6.63e-05 mem: 47% pow: 652.389 W 0: INFO 26-04-29 03:27:46.405782 - 2:10:14 - step: 5430 acc: 0 loss: 1.2673 grad: 1.59e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.689 data: 0.0666 lr: 6.63e-05 mem: 47% pow: 606.434 W 0: INFO 26-04-29 03:27:59.940619 - 2:10:28 - step: 5440 acc: 0 loss: 1.518 grad: 1.71e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.62 data: 0.0697 lr: 6.63e-05 mem: 47% pow: 666.246 W 0: INFO 26-04-29 03:28:13.820959 - 2:10:42 - step: 5450 acc: 0 loss: 1.6041 grad: 1.56e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6282 data: 0.0438 lr: 6.63e-05 mem: 47% pow: 660.872 W 0: INFO 26-04-29 03:28:27.203000 - 2:10:55 - step: 5460 acc: 0 loss: 1.4075 grad: 1.53e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.6299 data: 0.0641 lr: 6.63e-05 mem: 47% pow: 650.355 W 0: INFO 26-04-29 03:28:40.698029 - 2:11:09 - step: 5470 acc: 0 loss: 1.7646 grad: 1.56e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6242 data: 0.0634 lr: 6.63e-05 mem: 47% pow: 655.514 W 0: INFO 26-04-29 03:28:54.609577 - 2:11:23 - step: 5480 acc: 0 loss: 1.5568 grad: 1.67e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6237 data: 0.0651 lr: 6.62e-05 mem: 47% pow: 655.764 W 0: INFO 26-04-29 03:29:08.077819 - 2:11:36 - step: 5490 acc: 0 loss: 1.5903 grad: 1.53e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6073 data: 0.0687 lr: 6.62e-05 mem: 47% pow: 659.002 W 0: INFO 26-04-29 03:29:21.689467 - 2:11:50 - step: 5500 acc: 0 loss: 1.6048 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6039 data: 0.0764 lr: 6.62e-05 mem: 47% pow: 655.211 W 0: INFO 26-04-29 03:29:38.190235 - 2:12:06 - step: 5510 acc: 0 loss: 1.4184 grad: 1.64e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6197 data: 0.0684 lr: 6.62e-05 mem: 54% pow: 647.439 W 0: INFO 26-04-29 03:29:51.847560 - 2:12:20 - step: 5520 acc: 0 loss: 1.5826 grad: 1.58e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6131 data: 0.0642 lr: 6.62e-05 mem: 47% pow: 651.194 W 0: INFO 26-04-29 03:30:05.371735 - 2:12:33 - step: 5530 acc: 0 loss: 1.5909 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6636 data: 0.0551 lr: 6.62e-05 mem: 47% pow: 629.207 W 0: INFO 26-04-29 03:30:18.849727 - 2:12:47 - step: 5540 acc: 0 loss: 1.1915 grad: 1.59e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6243 data: 0.0763 lr: 6.62e-05 mem: 47% pow: 642.735 W 0: INFO 26-04-29 03:30:32.434686 - 2:13:01 - step: 5550 acc: 0 loss: 1.5188 grad: 1.52e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6103 data: 0.0719 lr: 6.61e-05 mem: 47% pow: 652.181 W 0: INFO 26-04-29 03:30:46.064128 - 2:13:14 - step: 5560 acc: 0 loss: 1.3817 grad: 1.61e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5981 data: 0.0744 lr: 6.61e-05 mem: 47% pow: 655.448 W 0: INFO 26-04-29 03:30:59.665743 - 2:13:28 - step: 5570 acc: 0 loss: 1.3962 grad: 1.65e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6003 data: 0.0714 lr: 6.61e-05 mem: 47% pow: 665.042 W 0: INFO 26-04-29 03:31:13.199421 - 2:13:41 - step: 5580 acc: 0 loss: 1.5973 grad: 1.55e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6882 data: 0.0602 lr: 6.61e-05 mem: 47% pow: 612.36 W 0: INFO 26-04-29 03:31:26.682823 - 2:13:55 - step: 5590 acc: 0 loss: 1.7391 grad: 1.66e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6113 data: 0.0668 lr: 6.61e-05 mem: 47% pow: 654.805 W 0: INFO 26-04-29 03:31:40.321163 - 2:14:08 - step: 5600 acc: 0 loss: 1.8569 grad: 1.58e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6785 data: 0.0607 lr: 6.61e-05 mem: 47% pow: 618.733 W 0: INFO 26-04-29 03:31:56.805906 - 2:14:25 - step: 5610 acc: 0 loss: 1.2832 grad: 1.53e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5843 data: 0.1025 lr: 6.61e-05 mem: 54% pow: 651.269 W 0: INFO 26-04-29 03:32:10.625288 - 2:14:39 - step: 5620 acc: 0 loss: 1.6423 grad: 1.52e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6001 data: 0.0773 lr: 6.60e-05 mem: 47% pow: 656.196 W 0: INFO 26-04-29 03:32:24.206816 - 2:14:52 - step: 5630 acc: 0 loss: 1.6935 grad: 1.75e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6102 data: 0.0669 lr: 6.60e-05 mem: 47% pow: 656.321 W 0: INFO 26-04-29 03:32:38.040511 - 2:15:06 - step: 5640 acc: 0 loss: 1.7292 grad: 1.93e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6172 data: 0.0749 lr: 6.60e-05 mem: 47% pow: 643.243 W 0: INFO 26-04-29 03:32:51.707419 - 2:15:20 - step: 5650 acc: 0 loss: 1.658 grad: 1.77e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6209 data: 0.0776 lr: 6.60e-05 mem: 47% pow: 640.942 W 0: INFO 26-04-29 03:33:05.441046 - 2:15:34 - step: 5660 acc: 0 loss: 1.6346 grad: 1.64e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6217 data: 0.0694 lr: 6.60e-05 mem: 47% pow: 656.298 W 0: INFO 26-04-29 03:33:18.959247 - 2:15:47 - step: 5670 acc: 0 loss: 1.4679 grad: 1.57e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6116 data: 0.0721 lr: 6.60e-05 mem: 47% pow: 653.846 W 0: INFO 26-04-29 03:33:32.642926 - 2:16:01 - step: 5680 acc: 0 loss: 1.5265 grad: 1.58e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6159 data: 0.0701 lr: 6.59e-05 mem: 47% pow: 653.245 W 0: INFO 26-04-29 03:33:46.095131 - 2:16:14 - step: 5690 acc: 0 loss: 1.7132 grad: 1.87e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6368 data: 0.0624 lr: 6.59e-05 mem: 47% pow: 637.853 W 0: INFO 26-04-29 03:34:00.165534 - 2:16:28 - step: 5700 acc: 0 loss: 1.6939 grad: 1.73e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6355 data: 0.0645 lr: 6.59e-05 mem: 47% pow: 649.091 W 0: INFO 26-04-29 03:34:16.718445 - 2:16:45 - step: 5710 acc: 0 loss: 1.5727 grad: 1.83e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6127 data: 0.0755 lr: 6.59e-05 mem: 54% pow: 660.614 W 0: INFO 26-04-29 03:34:30.281530 - 2:16:58 - step: 5720 acc: 0 loss: 1.5492 grad: 1.91e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6262 data: 0.0661 lr: 6.59e-05 mem: 47% pow: 642.216 W 0: INFO 26-04-29 03:34:44.102084 - 2:17:12 - step: 5730 acc: 0 loss: 1.5274 grad: 1.63e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5987 data: 0.0751 lr: 6.59e-05 mem: 47% pow: 651.772 W 0: INFO 26-04-29 03:34:58.001602 - 2:17:26 - step: 5740 acc: 0 loss: 1.5965 grad: 1.70e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.613 data: 0.0607 lr: 6.59e-05 mem: 47% pow: 662.979 W 0: INFO 26-04-29 03:35:11.951219 - 2:17:40 - step: 5750 acc: 0 loss: 1.7114 grad: 1.84e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7853 data: 0.1036 lr: 6.58e-05 mem: 47% pow: 530.89 W 0: INFO 26-04-29 03:35:25.662310 - 2:17:54 - step: 5760 acc: 0 loss: 1.6126 grad: 1.71e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5765 data: 0.0945 lr: 6.58e-05 mem: 47% pow: 671.322 W 0: INFO 26-04-29 03:35:39.128283 - 2:18:07 - step: 5770 acc: 0 loss: 1.4605 grad: 1.50e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.658 data: 0.0761 lr: 6.58e-05 mem: 47% pow: 617.931 W 0: INFO 26-04-29 03:35:53.254806 - 2:18:21 - step: 5780 acc: 0 loss: 1.3998 grad: 1.73e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6256 data: 0.0716 lr: 6.58e-05 mem: 47% pow: 645.951 W 0: INFO 26-04-29 03:36:07.017832 - 2:18:35 - step: 5790 acc: 0 loss: 1.621 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6053 data: 0.0824 lr: 6.58e-05 mem: 47% pow: 658.095 W 0: INFO 26-04-29 03:36:20.704568 - 2:18:49 - step: 5800 acc: 0 loss: 1.4159 grad: 1.58e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.727 data: 0.0442 lr: 6.58e-05 mem: 47% pow: 603.965 W 0: INFO 26-04-29 03:36:37.377360 - 2:19:05 - step: 5810 acc: 0 loss: 1.8923 grad: 1.60e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6167 data: 0.0719 lr: 6.58e-05 mem: 54% pow: 656.789 W 0: INFO 26-04-29 03:36:50.970645 - 2:19:19 - step: 5820 acc: 0 loss: 1.6693 grad: 1.54e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6386 data: 0.0612 lr: 6.57e-05 mem: 47% pow: 640.979 W 0: INFO 26-04-29 03:37:04.722205 - 2:19:33 - step: 5830 acc: 0 loss: 1.6495 grad: 1.58e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.602 data: 0.075 lr: 6.57e-05 mem: 47% pow: 657.265 W 0: INFO 26-04-29 03:37:18.642460 - 2:19:47 - step: 5840 acc: 0 loss: 1.8285 grad: 1.60e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6216 data: 0.0685 lr: 6.57e-05 mem: 47% pow: 648.013 W 0: INFO 26-04-29 03:37:32.237784 - 2:20:00 - step: 5850 acc: 0 loss: 1.4679 grad: 1.63e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6076 data: 0.0762 lr: 6.57e-05 mem: 47% pow: 652.411 W 0: INFO 26-04-29 03:37:45.828314 - 2:20:14 - step: 5860 acc: 0 loss: 1.6524 grad: 1.71e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6302 data: 0.0696 lr: 6.57e-05 mem: 47% pow: 643.316 W 0: INFO 26-04-29 03:37:59.465457 - 2:20:28 - step: 5870 acc: 0 loss: 1.5606 grad: 1.58e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6438 data: 0.0566 lr: 6.57e-05 mem: 47% pow: 651.892 W 0: INFO 26-04-29 03:38:13.039920 - 2:20:41 - step: 5880 acc: 0 loss: 1.2468 grad: 1.90e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6269 data: 0.0637 lr: 6.57e-05 mem: 47% pow: 653.16 W 0: INFO 26-04-29 03:38:26.750678 - 2:20:55 - step: 5890 acc: 0 loss: 1.5574 grad: 1.78e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6112 data: 0.0718 lr: 6.56e-05 mem: 47% pow: 658.327 W 0: INFO 26-04-29 03:38:40.330340 - 2:21:08 - step: 5900 acc: 0 loss: 1.6332 grad: 1.60e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6152 data: 0.0667 lr: 6.56e-05 mem: 47% pow: 654.723 W 0: INFO 26-04-29 03:38:56.888163 - 2:21:25 - step: 5910 acc: 0 loss: 1.3559 grad: 1.73e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6901 data: 0.0692 lr: 6.56e-05 mem: 54% pow: 609.063 W 0: INFO 26-04-29 03:39:10.384355 - 2:21:38 - step: 5920 acc: 0 loss: 1.7482 grad: 1.63e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6479 data: 0.0685 lr: 6.56e-05 mem: 47% pow: 635.903 W 0: INFO 26-04-29 03:39:24.147544 - 2:21:52 - step: 5930 acc: 0 loss: 1.5584 grad: 1.57e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.6196 data: 0.0697 lr: 6.56e-05 mem: 47% pow: 604.071 W 0: INFO 26-04-29 03:39:37.906345 - 2:22:06 - step: 5940 acc: 0 loss: 1.5983 grad: 1.79e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6144 data: 0.0622 lr: 6.56e-05 mem: 47% pow: 654.085 W 0: INFO 26-04-29 03:39:51.345837 - 2:22:19 - step: 5950 acc: 0 loss: 1.8693 grad: 1.67e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.619 data: 0.0794 lr: 6.55e-05 mem: 47% pow: 643.105 W 0: INFO 26-04-29 03:40:04.839720 - 2:22:33 - step: 5960 acc: 0 loss: 1.8859 grad: 1.67e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6126 data: 0.0917 lr: 6.55e-05 mem: 47% pow: 642.549 W 0: INFO 26-04-29 03:40:18.305719 - 2:22:46 - step: 5970 acc: 0 loss: 1.8245 grad: 1.64e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6238 data: 0.0736 lr: 6.55e-05 mem: 47% pow: 637.344 W 0: INFO 26-04-29 03:40:31.823789 - 2:23:00 - step: 5980 acc: 0 loss: 1.6007 grad: 1.60e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6091 data: 0.0677 lr: 6.55e-05 mem: 47% pow: 660.694 W 0: INFO 26-04-29 03:40:45.234140 - 2:23:13 - step: 5990 acc: 0 loss: 1.7805 grad: 1.54e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5976 data: 0.1019 lr: 6.55e-05 mem: 47% pow: 645.058 W 0: INFO 26-04-29 03:40:58.685744 - 2:23:27 - step: 6000 acc: 0 loss: 1.5954 grad: 1.89e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6105 data: 0.0686 lr: 6.55e-05 mem: 47% pow: 658.374 W 0: INFO 26-04-29 03:41:02.355451 - 2:23:30 - garbage collection 0: INFO 26-04-29 03:41:16.919243 - 2:23:45 - step: 6010 acc: 0 loss: 1.6174 grad: 1.67e-01 flops: 3.10e+14 wps: 3.60e+04 iter: 0.6352 data: 0.0742 lr: 6.55e-05 mem: 54% pow: 639.574 W 0: INFO 26-04-29 03:41:30.545426 - 2:23:59 - step: 6020 acc: 0 loss: 1.8436 grad: 1.56e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.616 data: 0.0748 lr: 6.54e-05 mem: 47% pow: 648.905 W 0: INFO 26-04-29 03:41:44.051636 - 2:24:12 - step: 6030 acc: 0 loss: 2.0523 grad: 1.72e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6099 data: 0.068 lr: 6.54e-05 mem: 47% pow: 652.004 W 0: INFO 26-04-29 03:41:58.265102 - 2:24:26 - step: 6040 acc: 0 loss: 1.8204 grad: 1.71e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.7247 data: 0.0716 lr: 6.54e-05 mem: 47% pow: 604.048 W 0: INFO 26-04-29 03:42:11.667743 - 2:24:40 - step: 6050 acc: 0 loss: 1.8272 grad: 1.64e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.6135 data: 0.0753 lr: 6.54e-05 mem: 47% pow: 669.223 W 0: INFO 26-04-29 03:42:25.326780 - 2:24:53 - step: 6060 acc: 0 loss: 1.4658 grad: 1.56e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6317 data: 0.0672 lr: 6.54e-05 mem: 47% pow: 669.956 W 0: INFO 26-04-29 03:42:38.878034 - 2:25:07 - step: 6070 acc: 0 loss: 1.7567 grad: 1.62e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6345 data: 0.0728 lr: 6.54e-05 mem: 47% pow: 656.106 W 0: INFO 26-04-29 03:42:52.526822 - 2:25:21 - step: 6080 acc: 0 loss: 1.7361 grad: 1.63e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6056 data: 0.0687 lr: 6.54e-05 mem: 47% pow: 670.154 W 0: INFO 26-04-29 03:43:06.027425 - 2:25:34 - step: 6090 acc: 0 loss: 1.8353 grad: 1.71e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6027 data: 0.0771 lr: 6.53e-05 mem: 47% pow: 650.775 W 0: INFO 26-04-29 03:43:19.641122 - 2:25:48 - step: 6100 acc: 0 loss: 1.7266 grad: 1.71e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6211 data: 0.0691 lr: 6.53e-05 mem: 47% pow: 644.543 W 0: INFO 26-04-29 03:43:36.245971 - 2:26:04 - step: 6110 acc: 0 loss: 1.4944 grad: 1.59e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6225 data: 0.0724 lr: 6.53e-05 mem: 54% pow: 639.921 W 0: INFO 26-04-29 03:43:49.723978 - 2:26:18 - step: 6120 acc: 0 loss: 1.4759 grad: 1.54e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6281 data: 0.0627 lr: 6.53e-05 mem: 47% pow: 659.597 W 0: INFO 26-04-29 03:44:03.354498 - 2:26:31 - step: 6130 acc: 0 loss: 1.372 grad: 1.63e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6232 data: 0.0586 lr: 6.53e-05 mem: 47% pow: 652.289 W 0: INFO 26-04-29 03:44:16.814726 - 2:26:45 - step: 6140 acc: 0 loss: 1.7143 grad: 1.75e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6123 data: 0.0676 lr: 6.53e-05 mem: 47% pow: 655.846 W 0: INFO 26-04-29 03:44:30.743441 - 2:26:59 - step: 6150 acc: 0 loss: 1.8766 grad: 1.55e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6258 data: 0.0648 lr: 6.53e-05 mem: 47% pow: 655.772 W 0: INFO 26-04-29 03:44:44.549985 - 2:27:13 - step: 6160 acc: 0 loss: 1.6406 grad: 1.62e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6095 data: 0.0707 lr: 6.52e-05 mem: 47% pow: 651.916 W 0: INFO 26-04-29 03:44:57.978659 - 2:27:26 - step: 6170 acc: 0 loss: 1.7834 grad: 1.60e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6019 data: 0.0704 lr: 6.52e-05 mem: 47% pow: 658.649 W 0: INFO 26-04-29 03:45:11.549725 - 2:27:40 - step: 6180 acc: 0 loss: 1.3773 grad: 1.48e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6295 data: 0.0716 lr: 6.52e-05 mem: 47% pow: 649.727 W 0: INFO 26-04-29 03:45:25.091698 - 2:27:53 - step: 6190 acc: 0 loss: 1.8082 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6135 data: 0.0918 lr: 6.52e-05 mem: 47% pow: 648.193 W 0: INFO 26-04-29 03:45:38.679713 - 2:28:07 - step: 6200 acc: 0 loss: 1.703 grad: 1.49e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6066 data: 0.0774 lr: 6.52e-05 mem: 47% pow: 654.027 W 0: INFO 26-04-29 03:45:55.364548 - 2:28:23 - step: 6210 acc: 0 loss: 1.7705 grad: 1.52e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6277 data: 0.0639 lr: 6.52e-05 mem: 54% pow: 653.807 W 0: INFO 26-04-29 03:46:09.008269 - 2:28:37 - step: 6220 acc: 0 loss: 1.2701 grad: 1.54e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.614 data: 0.078 lr: 6.51e-05 mem: 47% pow: 649.164 W 0: INFO 26-04-29 03:46:22.756567 - 2:28:51 - step: 6230 acc: 0 loss: 2.0833 grad: 1.60e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6015 data: 0.0782 lr: 6.51e-05 mem: 47% pow: 654.431 W 0: INFO 26-04-29 03:46:36.536376 - 2:29:05 - step: 6240 acc: 0 loss: 1.5705 grad: 1.59e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6404 data: 0.0498 lr: 6.51e-05 mem: 47% pow: 653.059 W 0: INFO 26-04-29 03:46:50.054485 - 2:29:18 - step: 6250 acc: 0 loss: 1.5288 grad: 1.59e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6001 data: 0.0857 lr: 6.51e-05 mem: 47% pow: 652.325 W 0: INFO 26-04-29 03:47:03.688886 - 2:29:32 - step: 6260 acc: 0 loss: 1.6745 grad: 1.58e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6082 data: 0.0715 lr: 6.51e-05 mem: 47% pow: 656.867 W 0: INFO 26-04-29 03:47:17.467241 - 2:29:46 - step: 6270 acc: 0 loss: 1.7521 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.7313 data: 0.066 lr: 6.51e-05 mem: 47% pow: 590.468 W 0: INFO 26-04-29 03:47:31.420202 - 2:30:00 - step: 6280 acc: 0 loss: 1.4844 grad: 1.61e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7204 data: 0.0709 lr: 6.51e-05 mem: 47% pow: 589.173 W 0: INFO 26-04-29 03:47:45.004241 - 2:30:13 - step: 6290 acc: 0 loss: 1.6901 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6371 data: 0.072 lr: 6.50e-05 mem: 47% pow: 652.141 W 0: INFO 26-04-29 03:47:58.485759 - 2:30:27 - step: 6300 acc: 0 loss: 1.8212 grad: 1.55e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6301 data: 0.0639 lr: 6.50e-05 mem: 47% pow: 643.302 W 0: INFO 26-04-29 03:48:15.016079 - 2:30:43 - step: 6310 acc: 0 loss: 1.5115 grad: 1.63e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6155 data: 0.0623 lr: 6.50e-05 mem: 54% pow: 655.622 W 0: INFO 26-04-29 03:48:28.659355 - 2:30:57 - step: 6320 acc: 0 loss: 1.7336 grad: 1.60e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6102 data: 0.0766 lr: 6.50e-05 mem: 47% pow: 658.739 W 0: INFO 26-04-29 03:48:42.295500 - 2:31:10 - step: 6330 acc: 0 loss: 1.8018 grad: 4.38e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6227 data: 0.0659 lr: 6.50e-05 mem: 47% pow: 653.927 W 0: INFO 26-04-29 03:48:55.775619 - 2:31:24 - step: 6340 acc: 0 loss: 1.5546 grad: 1.57e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6446 data: 0.0596 lr: 6.50e-05 mem: 47% pow: 657.17 W 0: INFO 26-04-29 03:49:09.814147 - 2:31:38 - step: 6350 acc: 0 loss: 1.415 grad: 1.67e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6349 data: 0.0686 lr: 6.50e-05 mem: 47% pow: 666.02 W 0: INFO 26-04-29 03:49:23.303795 - 2:31:51 - step: 6360 acc: 0 loss: 1.8595 grad: 1.48e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6265 data: 0.0598 lr: 6.49e-05 mem: 47% pow: 657.35 W 0: INFO 26-04-29 03:49:37.080465 - 2:32:05 - step: 6370 acc: 0 loss: 1.382 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6287 data: 0.0659 lr: 6.49e-05 mem: 47% pow: 645.426 W 0: INFO 26-04-29 03:49:50.885557 - 2:32:19 - step: 6380 acc: 0 loss: 1.5843 grad: 1.73e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6258 data: 0.0798 lr: 6.49e-05 mem: 47% pow: 656.337 W 0: INFO 26-04-29 03:50:04.950664 - 2:32:33 - step: 6390 acc: 0 loss: 1.7576 grad: 1.49e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6665 data: 0.0727 lr: 6.49e-05 mem: 47% pow: 615.13 W 0: INFO 26-04-29 03:50:18.532272 - 2:32:47 - step: 6400 acc: 0 loss: 1.4603 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6221 data: 0.0635 lr: 6.49e-05 mem: 47% pow: 646.55 W 0: INFO 26-04-29 03:50:35.375165 - 2:33:03 - step: 6410 acc: 0 loss: 2.3214 grad: 1.59e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6084 data: 0.0717 lr: 6.49e-05 mem: 54% pow: 655.344 W 0: INFO 26-04-29 03:50:49.029619 - 2:33:17 - step: 6420 acc: 0 loss: 1.5243 grad: 1.48e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6118 data: 0.0715 lr: 6.48e-05 mem: 47% pow: 648.242 W 0: INFO 26-04-29 03:51:02.735283 - 2:33:31 - step: 6430 acc: 0 loss: 1.6396 grad: 1.61e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6124 data: 0.0706 lr: 6.48e-05 mem: 47% pow: 648.962 W 0: INFO 26-04-29 03:51:16.654649 - 2:33:45 - step: 6440 acc: 0 loss: 1.6022 grad: 1.62e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6234 data: 0.0634 lr: 6.48e-05 mem: 47% pow: 664.004 W 0: INFO 26-04-29 03:51:30.559581 - 2:33:59 - step: 6450 acc: 0 loss: 1.3144 grad: 1.49e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6168 data: 0.0704 lr: 6.48e-05 mem: 47% pow: 651.725 W 0: INFO 26-04-29 03:51:44.301440 - 2:34:12 - step: 6460 acc: 0 loss: 1.3635 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6027 data: 0.0713 lr: 6.48e-05 mem: 47% pow: 665.78 W 0: INFO 26-04-29 03:51:58.317523 - 2:34:26 - step: 6470 acc: 0 loss: 1.8851 grad: 1.53e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6803 data: 0.0511 lr: 6.48e-05 mem: 47% pow: 624.887 W 0: INFO 26-04-29 03:52:12.227977 - 2:34:40 - step: 6480 acc: 0 loss: 1.8815 grad: 1.55e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.7177 data: 0.065 lr: 6.48e-05 mem: 47% pow: 595.114 W 0: INFO 26-04-29 03:52:26.096035 - 2:34:54 - step: 6490 acc: 0 loss: 1.6764 grad: 1.58e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6766 data: 0.0752 lr: 6.47e-05 mem: 47% pow: 622.559 W 0: INFO 26-04-29 03:52:40.136290 - 2:35:08 - step: 6500 acc: 0 loss: 1.4731 grad: 1.58e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.6477 data: 0.0732 lr: 6.47e-05 mem: 47% pow: 626.892 W 0: INFO 26-04-29 03:52:56.775968 - 2:35:25 - step: 6510 acc: 0 loss: 1.5637 grad: 1.63e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6315 data: 0.0586 lr: 6.47e-05 mem: 54% pow: 657.045 W 0: INFO 26-04-29 03:53:16.559749 - 2:35:45 - step: 6520 acc: 0 loss: 1.8173 grad: 1.68e-01 flops: 2.86e+14 wps: 3.32e+04 iter: 0.647 data: 0.0831 lr: 6.47e-05 mem: 47% pow: 631.601 W 0: INFO 26-04-29 03:53:31.246759 - 2:35:59 - step: 6530 acc: 0 loss: 1.6343 grad: 1.73e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6324 data: 0.0733 lr: 6.47e-05 mem: 47% pow: 646.198 W 0: INFO 26-04-29 03:53:45.316591 - 2:36:13 - step: 6540 acc: 0 loss: 1.7226 grad: 1.60e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.7799 data: 0.0742 lr: 6.47e-05 mem: 47% pow: 557.001 W 0: INFO 26-04-29 03:53:59.225693 - 2:36:27 - step: 6550 acc: 0 loss: 1.9042 grad: 1.64e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6002 data: 0.068 lr: 6.47e-05 mem: 47% pow: 674.559 W 0: INFO 26-04-29 03:54:13.100519 - 2:36:41 - step: 6560 acc: 0 loss: 1.6742 grad: 1.47e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.646 data: 0.0689 lr: 6.46e-05 mem: 47% pow: 631.466 W 0: INFO 26-04-29 03:54:26.911357 - 2:36:55 - step: 6570 acc: 0 loss: 1.2994 grad: 1.61e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6066 data: 0.0728 lr: 6.46e-05 mem: 47% pow: 659.534 W 0: INFO 26-04-29 03:54:40.581065 - 2:37:09 - step: 6580 acc: 0 loss: 1.4328 grad: 1.60e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.637 data: 0.0783 lr: 6.46e-05 mem: 47% pow: 633.996 W 0: INFO 26-04-29 03:54:54.467495 - 2:37:23 - step: 6590 acc: 0 loss: 1.9691 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6237 data: 0.0745 lr: 6.46e-05 mem: 47% pow: 640.413 W 0: INFO 26-04-29 03:55:08.374376 - 2:37:36 - step: 6600 acc: 0 loss: 1.7141 grad: 1.74e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6134 data: 0.0672 lr: 6.46e-05 mem: 47% pow: 654.444 W 0: INFO 26-04-29 03:55:25.044648 - 2:37:53 - step: 6610 acc: 0 loss: 1.9203 grad: 1.61e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6277 data: 0.0638 lr: 6.46e-05 mem: 54% pow: 652.956 W 0: INFO 26-04-29 03:55:38.724029 - 2:38:07 - step: 6620 acc: 0 loss: 1.5574 grad: 1.68e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5937 data: 0.0802 lr: 6.46e-05 mem: 47% pow: 669.867 W 0: INFO 26-04-29 03:55:52.619701 - 2:38:21 - step: 6630 acc: 0 loss: 1.699 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6272 data: 0.076 lr: 6.45e-05 mem: 47% pow: 645.272 W 0: INFO 26-04-29 03:56:06.831328 - 2:38:35 - step: 6640 acc: 0 loss: 1.5959 grad: 1.47e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.626 data: 0.0761 lr: 6.45e-05 mem: 47% pow: 645.949 W 0: INFO 26-04-29 03:56:20.874376 - 2:38:49 - step: 6650 acc: 0 loss: 1.4737 grad: 1.55e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6168 data: 0.0711 lr: 6.45e-05 mem: 47% pow: 654.235 W 0: INFO 26-04-29 03:56:34.984777 - 2:39:03 - step: 6660 acc: 0 loss: 1.6629 grad: 1.60e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6246 data: 0.0695 lr: 6.45e-05 mem: 47% pow: 647.927 W 0: INFO 26-04-29 03:56:49.068200 - 2:39:17 - step: 6670 acc: 0 loss: 1.6339 grad: 1.57e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6149 data: 0.0674 lr: 6.45e-05 mem: 47% pow: 651.574 W 0: INFO 26-04-29 03:57:02.827510 - 2:39:31 - step: 6680 acc: 0 loss: 1.8115 grad: 1.67e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5849 data: 0.0942 lr: 6.45e-05 mem: 47% pow: 654.949 W 0: INFO 26-04-29 03:57:16.653275 - 2:39:45 - step: 6690 acc: 0 loss: 1.1922 grad: 1.51e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6309 data: 0.0697 lr: 6.44e-05 mem: 47% pow: 641.912 W 0: INFO 26-04-29 03:57:30.424998 - 2:39:59 - step: 6700 acc: 0 loss: 1.6156 grad: 1.75e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6072 data: 0.0673 lr: 6.44e-05 mem: 47% pow: 658.062 W 0: INFO 26-04-29 03:57:47.861229 - 2:40:16 - step: 6710 acc: 0 loss: 1.3743 grad: 1.60e-01 flops: 3.24e+14 wps: 3.76e+04 iter: 0.6421 data: 0.0536 lr: 6.44e-05 mem: 54% pow: 642.031 W 0: INFO 26-04-29 03:58:01.719508 - 2:40:30 - step: 6720 acc: 0 loss: 2.0236 grad: 1.67e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6466 data: 0.0675 lr: 6.44e-05 mem: 47% pow: 645.619 W 0: INFO 26-04-29 03:58:15.589962 - 2:40:44 - step: 6730 acc: 0 loss: 1.6122 grad: 1.63e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6293 data: 0.0692 lr: 6.44e-05 mem: 47% pow: 642.617 W 0: INFO 26-04-29 03:58:29.309546 - 2:40:57 - step: 6740 acc: 0 loss: 1.6886 grad: 1.59e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5891 data: 0.0967 lr: 6.44e-05 mem: 47% pow: 656.988 W 0: INFO 26-04-29 03:58:43.062607 - 2:41:11 - step: 6750 acc: 0 loss: 1.3823 grad: 1.60e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.603 data: 0.0683 lr: 6.44e-05 mem: 47% pow: 668.924 W 0: INFO 26-04-29 03:58:59.710216 - 2:41:28 - step: 6760 acc: 0 loss: 1.9447 grad: 1.53e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 3.4772 data: 0.0652 lr: 6.43e-05 mem: 47% pow: 420.811 W 0: INFO 26-04-29 03:59:13.637452 - 2:41:42 - step: 6770 acc: 0 loss: 1.7328 grad: 1.46e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.6442 data: 0.0674 lr: 6.43e-05 mem: 47% pow: 640.133 W 0: INFO 26-04-29 03:59:27.277486 - 2:41:55 - step: 6780 acc: 0 loss: 1.7909 grad: 1.65e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6539 data: 0.069 lr: 6.43e-05 mem: 47% pow: 633.864 W 0: INFO 26-04-29 03:59:41.344052 - 2:42:09 - step: 6790 acc: 0 loss: 1.6067 grad: 1.55e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6122 data: 0.0639 lr: 6.43e-05 mem: 47% pow: 659.79 W 0: INFO 26-04-29 03:59:55.018487 - 2:42:23 - step: 6800 acc: 0 loss: 1.3743 grad: 1.50e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6386 data: 0.0634 lr: 6.43e-05 mem: 47% pow: 643.551 W 0: INFO 26-04-29 04:00:12.115424 - 2:42:40 - step: 6810 acc: 0 loss: 1.86 grad: 1.58e-01 flops: 3.31e+14 wps: 3.84e+04 iter: 0.9569 data: 0.0027 lr: 6.43e-05 mem: 54% pow: 498.224 W 0: INFO 26-04-29 04:00:26.303750 - 2:42:54 - step: 6820 acc: 0 loss: 1.8577 grad: 1.61e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6056 data: 0.0717 lr: 6.43e-05 mem: 47% pow: 659.952 W 0: INFO 26-04-29 04:00:40.006135 - 2:43:08 - step: 6830 acc: 0 loss: 1.7036 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6304 data: 0.071 lr: 6.42e-05 mem: 47% pow: 641.803 W 0: INFO 26-04-29 04:00:53.601863 - 2:43:22 - step: 6840 acc: 0 loss: 2.0803 grad: 1.59e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6104 data: 0.0669 lr: 6.42e-05 mem: 47% pow: 656.265 W 0: INFO 26-04-29 04:01:07.536871 - 2:43:36 - step: 6850 acc: 0 loss: 1.8923 grad: 1.66e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6685 data: 0.063 lr: 6.42e-05 mem: 47% pow: 630.501 W 0: INFO 26-04-29 04:01:24.762026 - 2:43:53 - step: 6860 acc: 0 loss: 1.6228 grad: 1.72e-01 flops: 3.28e+14 wps: 3.81e+04 iter: 0.6086 data: 0.0692 lr: 6.42e-05 mem: 47% pow: 656.034 W 0: INFO 26-04-29 04:01:38.853514 - 2:44:07 - step: 6870 acc: 0 loss: 2.0749 grad: 1.54e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6461 data: 0.0716 lr: 6.42e-05 mem: 47% pow: 626.322 W 0: INFO 26-04-29 04:01:52.475660 - 2:44:21 - step: 6880 acc: 0 loss: 1.8682 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6461 data: 0.0557 lr: 6.42e-05 mem: 47% pow: 642.049 W 0: INFO 26-04-29 04:02:06.225722 - 2:44:34 - step: 6890 acc: 0 loss: 1.5589 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6663 data: 0.0646 lr: 6.41e-05 mem: 47% pow: 630.27 W 0: INFO 26-04-29 04:02:20.065958 - 2:44:48 - step: 6900 acc: 0 loss: 1.7002 grad: 1.52e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6158 data: 0.0728 lr: 6.41e-05 mem: 47% pow: 653.185 W 0: INFO 26-04-29 04:02:36.979270 - 2:45:05 - step: 6910 acc: 0 loss: 1.5575 grad: 1.46e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6293 data: 0.0761 lr: 6.41e-05 mem: 54% pow: 649.332 W 0: INFO 26-04-29 04:02:50.768437 - 2:45:19 - step: 6920 acc: 0 loss: 1.8672 grad: 1.56e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6552 data: 0.0663 lr: 6.41e-05 mem: 47% pow: 637.781 W 0: INFO 26-04-29 04:03:06.670047 - 2:45:35 - step: 6930 acc: 0 loss: 1.4548 grad: 1.52e-01 flops: 3.55e+14 wps: 4.12e+04 iter: 2.7524 data: 0.0638 lr: 6.41e-05 mem: 47% pow: 440.36 W 0: INFO 26-04-29 04:03:20.707404 - 2:45:49 - step: 6940 acc: 0 loss: 1.7801 grad: 1.53e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6485 data: 0.0682 lr: 6.41e-05 mem: 47% pow: 644.056 W 0: INFO 26-04-29 04:03:34.361439 - 2:46:02 - step: 6950 acc: 0 loss: 1.2423 grad: 1.61e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6009 data: 0.077 lr: 6.41e-05 mem: 47% pow: 661.03 W 0: INFO 26-04-29 04:03:48.274351 - 2:46:16 - step: 6960 acc: 0 loss: 1.6665 grad: 1.55e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7303 data: 0.0724 lr: 6.40e-05 mem: 47% pow: 594.096 W 0: INFO 26-04-29 04:04:06.049742 - 2:46:34 - step: 6970 acc: 0 loss: 1.6687 grad: 1.59e-01 flops: 3.18e+14 wps: 3.69e+04 iter: 0.6477 data: 0.0797 lr: 6.40e-05 mem: 47% pow: 642.032 W 0: INFO 26-04-29 04:04:24.294417 - 2:46:52 - step: 6980 acc: 0 loss: 1.7309 grad: 1.66e-01 flops: 3.10e+14 wps: 3.60e+04 iter: 0.6782 data: 0.0667 lr: 6.40e-05 mem: 47% pow: 621.624 W 0: INFO 26-04-29 04:04:38.273926 - 2:47:06 - step: 6990 acc: 0 loss: 1.724 grad: 1.62e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6357 data: 0.0535 lr: 6.40e-05 mem: 47% pow: 656.439 W 0: INFO 26-04-29 04:04:53.201753 - 2:47:21 - step: 7000 acc: 0 loss: 1.5898 grad: 1.64e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.6705 data: 0.0725 lr: 6.40e-05 mem: 47% pow: 615.707 W 0: INFO 26-04-29 04:04:56.907578 - 2:47:25 - garbage collection 0: INFO 26-04-29 04:05:11.466113 - 2:47:40 - step: 7010 acc: 0 loss: 1.6994 grad: 1.62e-01 flops: 3.09e+14 wps: 3.59e+04 iter: 0.6186 data: 0.0765 lr: 6.40e-05 mem: 54% pow: 646.327 W 0: INFO 26-04-29 04:05:25.611164 - 2:47:54 - step: 7020 acc: 0 loss: 1.4393 grad: 1.82e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.7928 data: 0.066 lr: 6.40e-05 mem: 47% pow: 554.238 W 0: INFO 26-04-29 04:05:40.400316 - 2:48:08 - step: 7030 acc: 0 loss: 1.8209 grad: 1.73e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.6157 data: 0.0756 lr: 6.39e-05 mem: 47% pow: 667.744 W 0: INFO 26-04-29 04:05:54.305391 - 2:48:22 - step: 7040 acc: 0 loss: 1.4397 grad: 1.76e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6181 data: 0.0763 lr: 6.39e-05 mem: 47% pow: 644.978 W 0: INFO 26-04-29 04:06:08.146147 - 2:48:36 - step: 7050 acc: 0 loss: 1.669 grad: 1.46e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.632 data: 0.0647 lr: 6.39e-05 mem: 47% pow: 643.551 W 0: INFO 26-04-29 04:06:21.656085 - 2:48:50 - step: 7060 acc: 0 loss: 1.8283 grad: 1.47e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6132 data: 0.0798 lr: 6.39e-05 mem: 47% pow: 653.296 W 0: INFO 26-04-29 04:06:40.382558 - 2:49:08 - step: 7070 acc: 0 loss: 1.6846 grad: 1.66e-01 flops: 3.02e+14 wps: 3.50e+04 iter: 0.7211 data: 0.0704 lr: 6.39e-05 mem: 47% pow: 590.592 W 0: INFO 26-04-29 04:06:54.357627 - 2:49:22 - step: 7080 acc: 0 loss: 1.4489 grad: 1.76e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7025 data: 0.0655 lr: 6.39e-05 mem: 47% pow: 601.471 W 0: INFO 26-04-29 04:07:08.696739 - 2:49:37 - step: 7090 acc: 0 loss: 1.7944 grad: 1.60e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.5915 data: 0.0962 lr: 6.39e-05 mem: 47% pow: 651.621 W 0: INFO 26-04-29 04:07:23.298125 - 2:49:51 - step: 7100 acc: 0 loss: 1.3258 grad: 1.61e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 1.3204 data: 0.0746 lr: 6.38e-05 mem: 47% pow: 465.075 W 0: INFO 26-04-29 04:07:40.360965 - 2:50:08 - step: 7110 acc: 0 loss: 1.4703 grad: 1.79e-01 flops: 3.31e+14 wps: 3.84e+04 iter: 0.6421 data: 0.0729 lr: 6.38e-05 mem: 54% pow: 633.404 W 0: INFO 26-04-29 04:07:54.269450 - 2:50:22 - step: 7120 acc: 0 loss: 1.6136 grad: 1.68e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6369 data: 0.0492 lr: 6.38e-05 mem: 47% pow: 653.912 W 0: INFO 26-04-29 04:08:09.353446 - 2:50:37 - step: 7130 acc: 0 loss: 1.5043 grad: 1.52e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.612 data: 0.0917 lr: 6.38e-05 mem: 47% pow: 634.867 W 0: INFO 26-04-29 04:08:23.030302 - 2:50:51 - step: 7140 acc: 0 loss: 1.9014 grad: 1.64e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6509 data: 0.0722 lr: 6.38e-05 mem: 47% pow: 628.03 W 0: INFO 26-04-29 04:08:37.304160 - 2:51:05 - step: 7150 acc: 0 loss: 1.6017 grad: 1.51e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 1.1595 data: 0.0679 lr: 6.38e-05 mem: 47% pow: 419.154 W 0: INFO 26-04-29 04:08:51.646153 - 2:51:20 - step: 7160 acc: 0 loss: 1.6901 grad: 1.51e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6253 data: 0.0735 lr: 6.37e-05 mem: 47% pow: 640.933 W 0: INFO 26-04-29 04:09:05.522058 - 2:51:34 - step: 7170 acc: 0 loss: 1.355 grad: 1.53e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6054 data: 0.0734 lr: 6.37e-05 mem: 47% pow: 656.872 W 0: INFO 26-04-29 04:09:19.433998 - 2:51:48 - step: 7180 acc: 0 loss: 1.8551 grad: 1.64e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6177 data: 0.0687 lr: 6.37e-05 mem: 47% pow: 646.794 W 0: INFO 26-04-29 04:09:33.351727 - 2:52:01 - step: 7190 acc: 0 loss: 1.5222 grad: 1.62e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6438 data: 0.0641 lr: 6.37e-05 mem: 47% pow: 639.126 W 0: INFO 26-04-29 04:09:47.075834 - 2:52:15 - step: 7200 acc: 0 loss: 1.8402 grad: 1.61e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6538 data: 0.0692 lr: 6.37e-05 mem: 47% pow: 634.312 W 0: INFO 26-04-29 04:10:08.164107 - 2:52:36 - step: 7210 acc: 0 loss: 1.381 grad: 1.53e-01 flops: 2.68e+14 wps: 3.11e+04 iter: 0.6298 data: 0.0663 lr: 6.37e-05 mem: 54% pow: 646.233 W 0: INFO 26-04-29 04:10:21.640493 - 2:52:50 - step: 7220 acc: 0 loss: 1.4332 grad: 1.50e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6215 data: 0.0635 lr: 6.37e-05 mem: 47% pow: 648.489 W 0: INFO 26-04-29 04:10:35.180644 - 2:53:03 - step: 7230 acc: 0 loss: 1.697 grad: 1.54e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6531 data: 0.0719 lr: 6.36e-05 mem: 47% pow: 628.223 W 0: INFO 26-04-29 04:10:48.987447 - 2:53:17 - step: 7240 acc: 0 loss: 1.7173 grad: 1.50e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.619 data: 0.0727 lr: 6.36e-05 mem: 47% pow: 564.09 W 0: INFO 26-04-29 04:11:03.281868 - 2:53:31 - step: 7250 acc: 0 loss: 1.6993 grad: 1.54e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6154 data: 0.0725 lr: 6.36e-05 mem: 47% pow: 655.182 W 0: INFO 26-04-29 04:11:17.146634 - 2:53:45 - step: 7260 acc: 0 loss: 1.6234 grad: 1.58e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.8208 data: 0.0682 lr: 6.36e-05 mem: 47% pow: 541.004 W 0: INFO 26-04-29 04:11:30.907875 - 2:53:59 - step: 7270 acc: 0 loss: 1.5815 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6282 data: 0.0713 lr: 6.36e-05 mem: 47% pow: 637.688 W 0: INFO 26-04-29 04:11:44.950417 - 2:54:13 - step: 7280 acc: 0 loss: 1.2472 grad: 1.55e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6438 data: 0.042 lr: 6.36e-05 mem: 47% pow: 666.906 W 0: INFO 26-04-29 04:11:58.690754 - 2:54:27 - step: 7290 acc: 0 loss: 1.8476 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6147 data: 0.0693 lr: 6.36e-05 mem: 47% pow: 653.645 W 0: INFO 26-04-29 04:12:12.395848 - 2:54:40 - step: 7300 acc: 0 loss: 1.8574 grad: 1.42e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6268 data: 0.0807 lr: 6.35e-05 mem: 47% pow: 637.706 W 0: INFO 26-04-29 04:12:28.965210 - 2:54:57 - step: 7310 acc: 0 loss: 1.5335 grad: 1.60e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6042 data: 0.0718 lr: 6.35e-05 mem: 54% pow: 656.628 W 0: INFO 26-04-29 04:12:42.903124 - 2:55:11 - step: 7320 acc: 0 loss: 1.856 grad: 1.55e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6211 data: 0.0727 lr: 6.35e-05 mem: 47% pow: 645.238 W 0: INFO 26-04-29 04:12:56.704479 - 2:55:25 - step: 7330 acc: 0 loss: 1.7317 grad: 1.48e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6537 data: 0.0684 lr: 6.35e-05 mem: 47% pow: 643.614 W 0: INFO 26-04-29 04:13:10.802829 - 2:55:39 - step: 7340 acc: 0 loss: 1.3681 grad: 1.51e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6499 data: 0.0595 lr: 6.35e-05 mem: 47% pow: 641.363 W 0: INFO 26-04-29 04:13:24.659158 - 2:55:53 - step: 7350 acc: 0 loss: 1.3968 grad: 1.57e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5991 data: 0.0824 lr: 6.35e-05 mem: 47% pow: 652.845 W 0: INFO 26-04-29 04:13:39.154928 - 2:56:07 - step: 7360 acc: 0 loss: 1.8652 grad: 1.49e-01 flops: 3.90e+14 wps: 4.52e+04 iter: 0.5926 data: 0.0908 lr: 6.34e-05 mem: 47% pow: 658.928 W 0: INFO 26-04-29 04:13:52.817239 - 2:56:21 - step: 7370 acc: 0 loss: 1.2932 grad: 1.53e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.624 data: 0.0704 lr: 6.34e-05 mem: 47% pow: 647.578 W 0: INFO 26-04-29 04:14:06.802183 - 2:56:35 - step: 7380 acc: 0 loss: 1.6818 grad: 1.81e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6214 data: 0.0609 lr: 6.34e-05 mem: 47% pow: 655.79 W 0: INFO 26-04-29 04:14:20.800269 - 2:56:49 - step: 7390 acc: 0 loss: 1.6714 grad: 1.45e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6199 data: 0.0643 lr: 6.34e-05 mem: 47% pow: 656.292 W 0: INFO 26-04-29 04:14:34.936432 - 2:57:03 - step: 7400 acc: 0 loss: 1.5306 grad: 1.46e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.7863 data: 0.0715 lr: 6.34e-05 mem: 47% pow: 551.031 W 0: INFO 26-04-29 04:14:51.699148 - 2:57:20 - step: 7410 acc: 0 loss: 1.9551 grad: 1.61e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6137 data: 0.0732 lr: 6.34e-05 mem: 54% pow: 655.584 W 0: INFO 26-04-29 04:15:05.492835 - 2:57:34 - step: 7420 acc: 0 loss: 1.6274 grad: 1.53e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6105 data: 0.0707 lr: 6.34e-05 mem: 47% pow: 657.048 W 0: INFO 26-04-29 04:15:19.237270 - 2:57:47 - step: 7430 acc: 0 loss: 1.5167 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6447 data: 0.0669 lr: 6.33e-05 mem: 47% pow: 646.488 W 0: INFO 26-04-29 04:15:33.149634 - 2:58:01 - step: 7440 acc: 0 loss: 1.5207 grad: 1.52e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6833 data: 0.0662 lr: 6.33e-05 mem: 47% pow: 618.321 W 0: INFO 26-04-29 04:15:48.675568 - 2:58:17 - step: 7450 acc: 0 loss: 1.7548 grad: 1.66e-01 flops: 3.64e+14 wps: 4.22e+04 iter: 0.6064 data: 0.0768 lr: 6.33e-05 mem: 47% pow: 657.418 W 0: INFO 26-04-29 04:16:02.580576 - 2:58:31 - step: 7460 acc: 0 loss: 2.1885 grad: 1.65e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.7272 data: 0.0756 lr: 6.33e-05 mem: 47% pow: 592.365 W 0: INFO 26-04-29 04:16:16.528860 - 2:58:45 - step: 7470 acc: 0 loss: 1.5406 grad: 1.53e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6425 data: 0.0718 lr: 6.33e-05 mem: 47% pow: 631.158 W 0: INFO 26-04-29 04:16:30.281108 - 2:58:58 - step: 7480 acc: 0 loss: 1.5837 grad: 1.61e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6243 data: 0.0709 lr: 6.33e-05 mem: 47% pow: 648.769 W 0: INFO 26-04-29 04:16:43.945343 - 2:59:12 - step: 7490 acc: 0 loss: 1.5445 grad: 1.73e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6106 data: 0.058 lr: 6.33e-05 mem: 47% pow: 668.12 W 0: INFO 26-04-29 04:16:57.942923 - 2:59:26 - step: 7500 acc: 0 loss: 1.6091 grad: 1.60e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6241 data: 0.0645 lr: 6.32e-05 mem: 47% pow: 659.28 W 0: INFO 26-04-29 04:17:14.904405 - 2:59:43 - step: 7510 acc: 0 loss: 2.0607 grad: 1.60e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.5956 data: 0.0894 lr: 6.32e-05 mem: 54% pow: 649.925 W 0: INFO 26-04-29 04:17:28.849998 - 2:59:57 - step: 7520 acc: 0 loss: 1.7486 grad: 1.52e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6283 data: 0.0442 lr: 6.32e-05 mem: 47% pow: 658.173 W 0: INFO 26-04-29 04:17:42.561938 - 3:00:11 - step: 7530 acc: 0 loss: 1.4828 grad: 1.61e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6184 data: 0.0724 lr: 6.32e-05 mem: 47% pow: 666.276 W 0: INFO 26-04-29 04:17:56.237126 - 3:00:24 - step: 7540 acc: 0 loss: 1.8978 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6596 data: 0.0629 lr: 6.32e-05 mem: 47% pow: 627.2 W 0: INFO 26-04-29 04:18:10.114625 - 3:00:38 - step: 7550 acc: 0 loss: 1.8678 grad: 1.49e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6564 data: 0.0502 lr: 6.32e-05 mem: 47% pow: 641.383 W 0: INFO 26-04-29 04:18:24.124218 - 3:00:52 - step: 7560 acc: 0 loss: 1.711 grad: 1.67e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.9337 data: 0.0703 lr: 6.32e-05 mem: 47% pow: 475.397 W 0: INFO 26-04-29 04:18:37.648233 - 3:01:06 - step: 7570 acc: 0 loss: 1.7111 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6668 data: 0.0125 lr: 6.31e-05 mem: 47% pow: 670.036 W 0: INFO 26-04-29 04:18:51.171926 - 3:01:19 - step: 7580 acc: 0 loss: 1.7746 grad: 1.52e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6242 data: 0.0716 lr: 6.31e-05 mem: 47% pow: 649.021 W 0: INFO 26-04-29 04:19:05.098252 - 3:01:33 - step: 7590 acc: 0 loss: 1.2699 grad: 1.46e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6306 data: 0.072 lr: 6.31e-05 mem: 47% pow: 646.182 W 0: INFO 26-04-29 04:19:19.019122 - 3:01:47 - step: 7600 acc: 0 loss: 1.8115 grad: 1.48e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6561 data: 0.0699 lr: 6.31e-05 mem: 47% pow: 646.94 W 0: INFO 26-04-29 04:19:35.782306 - 3:02:04 - step: 7610 acc: 0 loss: 1.9178 grad: 1.52e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.608 data: 0.0728 lr: 6.31e-05 mem: 54% pow: 651.274 W 0: INFO 26-04-29 04:19:49.702680 - 3:02:18 - step: 7620 acc: 0 loss: 1.393 grad: 1.53e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6214 data: 0.0756 lr: 6.31e-05 mem: 47% pow: 661.681 W 0: INFO 26-04-29 04:20:03.571094 - 3:02:32 - step: 7630 acc: 0 loss: 1.5967 grad: 1.57e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6234 data: 0.068 lr: 6.30e-05 mem: 47% pow: 659.504 W 0: INFO 26-04-29 04:20:17.579156 - 3:02:46 - step: 7640 acc: 0 loss: 1.6119 grad: 1.54e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.7138 data: 0.0742 lr: 6.30e-05 mem: 47% pow: 601.253 W 0: INFO 26-04-29 04:20:31.129822 - 3:02:59 - step: 7650 acc: 0 loss: 1.4947 grad: 1.55e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6049 data: 0.0668 lr: 6.30e-05 mem: 47% pow: 667.117 W 0: INFO 26-04-29 04:20:44.879330 - 3:03:13 - step: 7660 acc: 0 loss: 1.9088 grad: 1.61e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6793 data: 0.065 lr: 6.30e-05 mem: 47% pow: 622.538 W 0: INFO 26-04-29 04:20:58.792261 - 3:03:27 - step: 7670 acc: 0 loss: 1.4861 grad: 1.50e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6611 data: 0.0721 lr: 6.30e-05 mem: 47% pow: 619.323 W 0: INFO 26-04-29 04:21:12.385466 - 3:03:40 - step: 7680 acc: 0 loss: 1.6952 grad: 1.56e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6271 data: 0.0612 lr: 6.30e-05 mem: 47% pow: 660.323 W 0: INFO 26-04-29 04:21:26.855951 - 3:03:55 - step: 7690 acc: 0 loss: 1.6208 grad: 1.51e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.6323 data: 0.0826 lr: 6.30e-05 mem: 47% pow: 643.45 W 0: INFO 26-04-29 04:21:40.480009 - 3:04:09 - step: 7700 acc: 0 loss: 1.8182 grad: 1.52e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6099 data: 0.0747 lr: 6.29e-05 mem: 47% pow: 655.05 W 0: INFO 26-04-29 04:21:57.127929 - 3:04:25 - step: 7710 acc: 0 loss: 1.8892 grad: 1.47e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6362 data: 0.1065 lr: 6.29e-05 mem: 54% pow: 618.841 W 0: INFO 26-04-29 04:22:11.141802 - 3:04:39 - step: 7720 acc: 0 loss: 1.6327 grad: 1.52e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6323 data: 0.0712 lr: 6.29e-05 mem: 47% pow: 646.569 W 0: INFO 26-04-29 04:22:25.109427 - 3:04:53 - step: 7730 acc: 0 loss: 1.5687 grad: 1.56e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6483 data: 0.0682 lr: 6.29e-05 mem: 47% pow: 635.511 W 0: INFO 26-04-29 04:22:39.088965 - 3:05:07 - step: 7740 acc: 0 loss: 1.7482 grad: 1.54e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6521 data: 0.0617 lr: 6.29e-05 mem: 47% pow: 637.721 W 0: INFO 26-04-29 04:22:52.906347 - 3:05:21 - step: 7750 acc: 0 loss: 1.7314 grad: 1.54e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6027 data: 0.0809 lr: 6.29e-05 mem: 47% pow: 653.177 W 0: INFO 26-04-29 04:23:06.421420 - 3:05:35 - step: 7760 acc: 0 loss: 1.7422 grad: 1.49e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6034 data: 0.0793 lr: 6.29e-05 mem: 47% pow: 659.608 W 0: INFO 26-04-29 04:23:20.041825 - 3:05:48 - step: 7770 acc: 0 loss: 1.9796 grad: 1.42e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6378 data: 0.066 lr: 6.28e-05 mem: 47% pow: 636.486 W 0: INFO 26-04-29 04:23:33.943436 - 3:06:02 - step: 7780 acc: 0 loss: 1.724 grad: 1.51e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6103 data: 0.0713 lr: 6.28e-05 mem: 47% pow: 655.899 W 0: INFO 26-04-29 04:23:47.492431 - 3:06:16 - step: 7790 acc: 0 loss: 1.559 grad: 1.47e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6353 data: 0.0721 lr: 6.28e-05 mem: 47% pow: 640.728 W 0: INFO 26-04-29 04:24:01.096058 - 3:06:29 - step: 7800 acc: 0 loss: 1.8321 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6891 data: 0.0638 lr: 6.28e-05 mem: 47% pow: 622.474 W 0: INFO 26-04-29 04:24:17.751066 - 3:06:46 - step: 7810 acc: 0 loss: 1.5388 grad: 1.51e-01 flops: 3.41e+14 wps: 3.95e+04 iter: 0.7518 data: 0.0688 lr: 6.28e-05 mem: 54% pow: 580.579 W 0: INFO 26-04-29 04:24:31.500452 - 3:07:00 - step: 7820 acc: 0 loss: 1.4496 grad: 1.52e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6177 data: 0.0722 lr: 6.28e-05 mem: 47% pow: 658.931 W 0: INFO 26-04-29 04:24:45.268029 - 3:07:13 - step: 7830 acc: 0 loss: 1.4844 grad: 1.49e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6208 data: 0.0695 lr: 6.28e-05 mem: 47% pow: 655.467 W 0: INFO 26-04-29 04:24:59.129030 - 3:07:27 - step: 7840 acc: 0 loss: 1.749 grad: 1.49e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6946 data: 0.0751 lr: 6.27e-05 mem: 47% pow: 607.046 W 0: INFO 26-04-29 04:25:12.853636 - 3:07:41 - step: 7850 acc: 0 loss: 1.4757 grad: 1.44e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6158 data: 0.0728 lr: 6.27e-05 mem: 47% pow: 651.887 W 0: INFO 26-04-29 04:25:26.833500 - 3:07:55 - step: 7860 acc: 0 loss: 1.569 grad: 1.45e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5949 data: 0.0803 lr: 6.27e-05 mem: 47% pow: 666.28 W 0: INFO 26-04-29 04:25:40.841364 - 3:08:09 - step: 7870 acc: 0 loss: 1.5808 grad: 1.52e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6952 data: 0.0203 lr: 6.27e-05 mem: 47% pow: 642.586 W 0: INFO 26-04-29 04:25:54.497870 - 3:08:23 - step: 7880 acc: 0 loss: 1.4344 grad: 1.47e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6564 data: 0.072 lr: 6.27e-05 mem: 47% pow: 636.739 W 0: INFO 26-04-29 04:26:08.292521 - 3:08:36 - step: 7890 acc: 0 loss: 1.3709 grad: 1.48e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6414 data: 0.0671 lr: 6.27e-05 mem: 47% pow: 648.467 W 0: INFO 26-04-29 04:26:22.137279 - 3:08:50 - step: 7900 acc: 0 loss: 1.734 grad: 1.58e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.7117 data: 0.0672 lr: 6.26e-05 mem: 47% pow: 605.159 W 0: INFO 26-04-29 04:26:38.713922 - 3:09:07 - step: 7910 acc: 0 loss: 1.754 grad: 1.50e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.5965 data: 0.0705 lr: 6.26e-05 mem: 54% pow: 666.169 W 0: INFO 26-04-29 04:26:52.386999 - 3:09:20 - step: 7920 acc: 0 loss: 1.6597 grad: 1.57e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6051 data: 0.0825 lr: 6.26e-05 mem: 47% pow: 650.954 W 0: INFO 26-04-29 04:27:06.524756 - 3:09:35 - step: 7930 acc: 0 loss: 1.6207 grad: 1.44e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.58 data: 0.2039 lr: 6.26e-05 mem: 47% pow: 606.199 W 0: INFO 26-04-29 04:27:20.029307 - 3:09:48 - step: 7940 acc: 0 loss: 1.6834 grad: 1.57e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6145 data: 0.0727 lr: 6.26e-05 mem: 47% pow: 655.818 W 0: INFO 26-04-29 04:27:33.723989 - 3:10:02 - step: 7950 acc: 0 loss: 1.7178 grad: 1.45e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6431 data: 0.0735 lr: 6.26e-05 mem: 47% pow: 628.721 W 0: INFO 26-04-29 04:27:47.788073 - 3:10:16 - step: 7960 acc: 0 loss: 1.5321 grad: 1.47e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.7095 data: 0.0703 lr: 6.26e-05 mem: 47% pow: 595.673 W 0: INFO 26-04-29 04:28:01.497433 - 3:10:30 - step: 7970 acc: 0 loss: 1.6686 grad: 1.42e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6222 data: 0.067 lr: 6.25e-05 mem: 47% pow: 666.185 W 0: INFO 26-04-29 04:28:15.234368 - 3:10:43 - step: 7980 acc: 0 loss: 1.5067 grad: 1.54e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6554 data: 0.0678 lr: 6.25e-05 mem: 47% pow: 633.293 W 0: INFO 26-04-29 04:28:29.979665 - 3:10:58 - step: 7990 acc: 0 loss: 1.624 grad: 1.51e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.6268 data: 0.0697 lr: 6.25e-05 mem: 47% pow: 649.353 W 0: INFO 26-04-29 04:28:43.851867 - 3:11:12 - step: 8000 acc: 0 loss: 1.554 grad: 1.55e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6154 data: 0.0694 lr: 6.25e-05 mem: 47% pow: 653.219 W 0: INFO 26-04-29 04:28:47.507697 - 3:11:16 - garbage collection 0: INFO 26-04-29 04:29:02.065707 - 3:11:30 - step: 8010 acc: 0 loss: 1.4368 grad: 1.56e-01 flops: 3.10e+14 wps: 3.60e+04 iter: 0.6641 data: 0.0708 lr: 6.25e-05 mem: 54% pow: 625.173 W 0: INFO 26-04-29 04:29:15.692604 - 3:11:44 - step: 8020 acc: 0 loss: 1.7108 grad: 1.51e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6185 data: 0.0509 lr: 6.25e-05 mem: 47% pow: 664.687 W 0: INFO 26-04-29 04:29:29.529827 - 3:11:58 - step: 8030 acc: 0 loss: 1.4547 grad: 1.51e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6449 data: 0.0659 lr: 6.25e-05 mem: 47% pow: 637.588 W 0: INFO 26-04-29 04:29:43.028848 - 3:12:11 - step: 8040 acc: 0 loss: 1.319 grad: 1.50e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6339 data: 0.0703 lr: 6.24e-05 mem: 47% pow: 641.372 W 0: INFO 26-04-29 04:29:56.585502 - 3:12:25 - step: 8050 acc: 0 loss: 1.5114 grad: 1.46e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6273 data: 0.067 lr: 6.24e-05 mem: 47% pow: 649.428 W 0: INFO 26-04-29 04:30:10.387925 - 3:12:38 - step: 8060 acc: 0 loss: 1.788 grad: 1.47e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6058 data: 0.0733 lr: 6.24e-05 mem: 47% pow: 648.209 W 0: INFO 26-04-29 04:30:24.520338 - 3:12:53 - step: 8070 acc: 0 loss: 1.561 grad: 1.52e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6257 data: 0.0736 lr: 6.24e-05 mem: 47% pow: 644.04 W 0: INFO 26-04-29 04:30:38.070116 - 3:13:06 - step: 8080 acc: 0 loss: 1.2974 grad: 1.45e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6235 data: 0.0676 lr: 6.24e-05 mem: 47% pow: 656.973 W 0: INFO 26-04-29 04:30:51.804833 - 3:13:20 - step: 8090 acc: 0 loss: 1.5762 grad: 1.45e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6874 data: 0.0713 lr: 6.24e-05 mem: 47% pow: 607.264 W 0: INFO 26-04-29 04:31:05.364949 - 3:13:33 - step: 8100 acc: 0 loss: 2.0229 grad: 1.53e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6099 data: 0.0715 lr: 6.23e-05 mem: 47% pow: 639.636 W 0: INFO 26-04-29 04:31:21.923239 - 3:13:50 - step: 8110 acc: 0 loss: 1.6423 grad: 1.43e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6023 data: 0.0746 lr: 6.23e-05 mem: 54% pow: 657.675 W 0: INFO 26-04-29 04:31:35.629251 - 3:14:04 - step: 8120 acc: 0 loss: 1.9332 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6229 data: 0.0644 lr: 6.23e-05 mem: 47% pow: 654.862 W 0: INFO 26-04-29 04:31:49.150850 - 3:14:17 - step: 8130 acc: 0 loss: 1.6256 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6444 data: 0.0759 lr: 6.23e-05 mem: 47% pow: 636.966 W 0: INFO 26-04-29 04:32:02.975936 - 3:14:31 - step: 8140 acc: 0 loss: 1.761 grad: 1.48e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.624 data: 0.0911 lr: 6.23e-05 mem: 47% pow: 642.527 W 0: INFO 26-04-29 04:32:16.640529 - 3:14:45 - step: 8150 acc: 0 loss: 1.4573 grad: 1.51e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6471 data: 0.07 lr: 6.23e-05 mem: 47% pow: 626.06 W 0: INFO 26-04-29 04:32:30.597964 - 3:14:59 - step: 8160 acc: 0 loss: 1.5342 grad: 1.59e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6639 data: 0.0703 lr: 6.23e-05 mem: 47% pow: 622.629 W 0: INFO 26-04-29 04:32:44.407125 - 3:15:12 - step: 8170 acc: 0 loss: 1.3298 grad: 1.65e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5793 data: 0.1073 lr: 6.22e-05 mem: 47% pow: 653.403 W 0: INFO 26-04-29 04:32:57.917347 - 3:15:26 - step: 8180 acc: 0 loss: 1.7265 grad: 1.61e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6633 data: 0.0415 lr: 6.22e-05 mem: 47% pow: 647.614 W 0: INFO 26-04-29 04:33:11.814712 - 3:15:40 - step: 8190 acc: 0 loss: 1.7463 grad: 1.50e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6273 data: 0.0725 lr: 6.22e-05 mem: 47% pow: 633.979 W 0: INFO 26-04-29 04:33:25.547382 - 3:15:54 - step: 8200 acc: 0 loss: 1.2207 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7075 data: 0.0705 lr: 6.22e-05 mem: 47% pow: 599.298 W 0: INFO 26-04-29 04:33:42.328951 - 3:16:10 - step: 8210 acc: 0 loss: 1.559 grad: 1.66e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6679 data: 0.0735 lr: 6.22e-05 mem: 54% pow: 620.915 W 0: INFO 26-04-29 04:33:56.251422 - 3:16:24 - step: 8220 acc: 0 loss: 1.4911 grad: 1.58e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7851 data: 0.077 lr: 6.22e-05 mem: 47% pow: 552.794 W 0: INFO 26-04-29 04:34:10.128996 - 3:16:38 - step: 8230 acc: 0 loss: 1.2525 grad: 1.55e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6156 data: 0.0715 lr: 6.22e-05 mem: 47% pow: 647.57 W 0: INFO 26-04-29 04:34:23.981231 - 3:16:52 - step: 8240 acc: 0 loss: 1.6674 grad: 1.49e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6334 data: 0.0664 lr: 6.21e-05 mem: 47% pow: 645.052 W 0: INFO 26-04-29 04:34:37.940706 - 3:17:06 - step: 8250 acc: 0 loss: 1.2309 grad: 1.47e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6355 data: 0.0807 lr: 6.21e-05 mem: 47% pow: 628.526 W 0: INFO 26-04-29 04:34:51.520509 - 3:17:20 - step: 8260 acc: 0 loss: 1.4715 grad: 1.48e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6256 data: 0.0721 lr: 6.21e-05 mem: 47% pow: 650.267 W 0: INFO 26-04-29 04:35:05.127498 - 3:17:33 - step: 8270 acc: 0 loss: 1.7064 grad: 1.61e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6615 data: 0.0782 lr: 6.21e-05 mem: 47% pow: 624.317 W 0: INFO 26-04-29 04:35:18.717367 - 3:17:47 - step: 8280 acc: 0 loss: 1.4686 grad: 1.48e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6593 data: 0.0677 lr: 6.21e-05 mem: 47% pow: 639.142 W 0: INFO 26-04-29 04:35:32.228302 - 3:18:00 - step: 8290 acc: 0 loss: 1.6231 grad: 1.51e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6168 data: 0.0638 lr: 6.21e-05 mem: 47% pow: 656.512 W 0: INFO 26-04-29 04:35:46.779303 - 3:18:15 - step: 8300 acc: 0 loss: 1.4171 grad: 1.53e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.8605 data: 0.0692 lr: 6.21e-05 mem: 47% pow: 509.791 W 0: INFO 26-04-29 04:36:07.141640 - 3:18:35 - step: 8310 acc: 0 loss: 1.3917 grad: 1.47e-01 flops: 2.77e+14 wps: 3.22e+04 iter: 0.6197 data: 0.0692 lr: 6.20e-05 mem: 54% pow: 621.128 W 0: INFO 26-04-29 04:36:21.589728 - 3:18:50 - step: 8320 acc: 0 loss: 1.737 grad: 1.48e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.628 data: 0.0668 lr: 6.20e-05 mem: 47% pow: 648.304 W 0: INFO 26-04-29 04:36:36.160034 - 3:19:04 - step: 8330 acc: 0 loss: 1.8113 grad: 1.53e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6299 data: 0.0773 lr: 6.20e-05 mem: 47% pow: 645.171 W 0: INFO 26-04-29 04:36:49.787882 - 3:19:18 - step: 8340 acc: 0 loss: 1.5262 grad: 1.62e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6129 data: 0.0698 lr: 6.20e-05 mem: 47% pow: 651.688 W 0: INFO 26-04-29 04:37:03.712221 - 3:19:32 - step: 8350 acc: 0 loss: 1.5659 grad: 1.56e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7624 data: 0.0795 lr: 6.20e-05 mem: 47% pow: 581.311 W 0: INFO 26-04-29 04:37:17.656829 - 3:19:46 - step: 8360 acc: 0 loss: 1.8101 grad: 1.56e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6607 data: 0.0705 lr: 6.20e-05 mem: 47% pow: 637.765 W 0: INFO 26-04-29 04:37:31.407907 - 3:19:59 - step: 8370 acc: 0 loss: 1.6959 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6136 data: 0.0703 lr: 6.19e-05 mem: 47% pow: 652.448 W 0: INFO 26-04-29 04:37:44.893445 - 3:20:13 - step: 8380 acc: 0 loss: 1.9135 grad: 1.54e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.636 data: 0.0552 lr: 6.19e-05 mem: 47% pow: 645.532 W 0: INFO 26-04-29 04:37:58.531809 - 3:20:27 - step: 8390 acc: 0 loss: 1.8029 grad: 1.56e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6683 data: 0.0693 lr: 6.19e-05 mem: 47% pow: 626.974 W 0: INFO 26-04-29 04:38:12.113384 - 3:20:40 - step: 8400 acc: 0 loss: 1.6778 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5789 data: 0.1004 lr: 6.19e-05 mem: 47% pow: 656.139 W 0: INFO 26-04-29 04:38:28.773789 - 3:20:57 - step: 8410 acc: 0 loss: 1.674 grad: 1.44e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6897 data: 0.0025 lr: 6.19e-05 mem: 54% pow: 657.943 W 0: INFO 26-04-29 04:38:42.488377 - 3:21:11 - step: 8420 acc: 0 loss: 1.409 grad: 1.56e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6398 data: 0.0702 lr: 6.19e-05 mem: 47% pow: 658.392 W 0: INFO 26-04-29 04:38:56.080669 - 3:21:24 - step: 8430 acc: 0 loss: 1.5604 grad: 1.54e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6108 data: 0.0677 lr: 6.19e-05 mem: 47% pow: 653.32 W 0: INFO 26-04-29 04:39:09.843247 - 3:21:38 - step: 8440 acc: 0 loss: 1.5623 grad: 1.50e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6079 data: 0.0715 lr: 6.18e-05 mem: 47% pow: 650.17 W 0: INFO 26-04-29 04:39:23.441046 - 3:21:52 - step: 8450 acc: 0 loss: 1.6477 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6198 data: 0.0591 lr: 6.18e-05 mem: 47% pow: 650.481 W 0: INFO 26-04-29 04:39:37.144613 - 3:22:05 - step: 8460 acc: 0 loss: 1.6938 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6056 data: 0.0762 lr: 6.18e-05 mem: 47% pow: 651.583 W 0: INFO 26-04-29 04:39:50.873924 - 3:22:19 - step: 8470 acc: 0 loss: 1.7126 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6574 data: 0.0782 lr: 6.18e-05 mem: 47% pow: 635.23 W 0: INFO 26-04-29 04:40:04.349263 - 3:22:32 - step: 8480 acc: 0 loss: 1.6335 grad: 1.54e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6284 data: 0.0586 lr: 6.18e-05 mem: 47% pow: 657.129 W 0: INFO 26-04-29 04:40:18.272120 - 3:22:46 - step: 8490 acc: 0 loss: 1.34 grad: 1.51e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6016 data: 0.0757 lr: 6.18e-05 mem: 47% pow: 653.017 W 0: INFO 26-04-29 04:40:32.303789 - 3:23:00 - step: 8500 acc: 0 loss: 1.5238 grad: 1.50e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6192 data: 0.0764 lr: 6.18e-05 mem: 47% pow: 646.096 W 0: INFO 26-04-29 04:40:49.151487 - 3:23:17 - step: 8510 acc: 0 loss: 1.7313 grad: 1.46e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6165 data: 0.0644 lr: 6.17e-05 mem: 54% pow: 652.066 W 0: INFO 26-04-29 04:41:02.884654 - 3:23:31 - step: 8520 acc: 0 loss: 1.7521 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6399 data: 0.0735 lr: 6.17e-05 mem: 47% pow: 652.555 W 0: INFO 26-04-29 04:41:16.616518 - 3:23:45 - step: 8530 acc: 0 loss: 1.5627 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6019 data: 0.0726 lr: 6.17e-05 mem: 47% pow: 663.509 W 0: INFO 26-04-29 04:41:30.555571 - 3:23:59 - step: 8540 acc: 0 loss: 1.4296 grad: 1.44e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7638 data: 0.0644 lr: 6.17e-05 mem: 47% pow: 575.854 W 0: INFO 26-04-29 04:41:44.003798 - 3:24:12 - step: 8550 acc: 0 loss: 1.5223 grad: 1.56e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6091 data: 0.0698 lr: 6.17e-05 mem: 47% pow: 659.027 W 0: INFO 26-04-29 04:41:57.793528 - 3:24:26 - step: 8560 acc: 0 loss: 1.7679 grad: 1.53e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6078 data: 0.0788 lr: 6.17e-05 mem: 47% pow: 657.261 W 0: INFO 26-04-29 04:42:11.435852 - 3:24:40 - step: 8570 acc: 0 loss: 1.5182 grad: 1.48e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6355 data: 0.0741 lr: 6.16e-05 mem: 47% pow: 646.813 W 0: INFO 26-04-29 04:42:25.193915 - 3:24:53 - step: 8580 acc: 0 loss: 1.5381 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6105 data: 0.07 lr: 6.16e-05 mem: 47% pow: 651.562 W 0: INFO 26-04-29 04:42:38.785912 - 3:25:07 - step: 8590 acc: 0 loss: 1.6996 grad: 1.50e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6248 data: 0.0744 lr: 6.16e-05 mem: 47% pow: 640.106 W 0: INFO 26-04-29 04:42:52.376240 - 3:25:20 - step: 8600 acc: 0 loss: 1.9073 grad: 1.51e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6323 data: 0.0693 lr: 6.16e-05 mem: 47% pow: 642.38 W 0: INFO 26-04-29 04:43:08.994760 - 3:25:37 - step: 8610 acc: 0 loss: 1.8242 grad: 1.47e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6384 data: 0.0713 lr: 6.16e-05 mem: 54% pow: 638.537 W 0: INFO 26-04-29 04:43:23.101015 - 3:25:51 - step: 8620 acc: 0 loss: 1.7171 grad: 1.53e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.5953 data: 0.0815 lr: 6.16e-05 mem: 47% pow: 662.932 W 0: INFO 26-04-29 04:43:37.036380 - 3:26:05 - step: 8630 acc: 0 loss: 1.6555 grad: 1.93e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6011 data: 0.0839 lr: 6.16e-05 mem: 47% pow: 658.123 W 0: INFO 26-04-29 04:43:50.633783 - 3:26:19 - step: 8640 acc: 0 loss: 1.7955 grad: 1.54e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6104 data: 0.0758 lr: 6.15e-05 mem: 47% pow: 649.106 W 0: INFO 26-04-29 04:44:04.179854 - 3:26:32 - step: 8650 acc: 0 loss: 1.7218 grad: 1.44e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.62 data: 0.0597 lr: 6.15e-05 mem: 47% pow: 655.658 W 0: INFO 26-04-29 04:44:17.747205 - 3:26:46 - step: 8660 acc: 0 loss: 1.5881 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.61 data: 0.077 lr: 6.15e-05 mem: 47% pow: 657.879 W 0: INFO 26-04-29 04:44:31.183073 - 3:26:59 - step: 8670 acc: 0 loss: 1.4748 grad: 1.53e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6375 data: 0.0744 lr: 6.15e-05 mem: 47% pow: 648.841 W 0: INFO 26-04-29 04:44:45.027287 - 3:27:13 - step: 8680 acc: 0 loss: 1.4855 grad: 1.47e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.8323 data: 0.0696 lr: 6.15e-05 mem: 47% pow: 525.775 W 0: INFO 26-04-29 04:44:58.728316 - 3:27:27 - step: 8690 acc: 0 loss: 1.2724 grad: 1.49e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6399 data: 0.0712 lr: 6.15e-05 mem: 47% pow: 645.762 W 0: INFO 26-04-29 04:45:12.224157 - 3:27:40 - step: 8700 acc: 0 loss: 1.4537 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6215 data: 0.0664 lr: 6.15e-05 mem: 47% pow: 660.283 W 0: INFO 26-04-29 04:45:29.041957 - 3:27:57 - step: 8710 acc: 0 loss: 1.5246 grad: 1.80e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6503 data: 0.0435 lr: 6.14e-05 mem: 54% pow: 667.164 W 0: INFO 26-04-29 04:45:42.886207 - 3:28:11 - step: 8720 acc: 0 loss: 1.6437 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6375 data: 0.0693 lr: 6.14e-05 mem: 47% pow: 646.249 W 0: INFO 26-04-29 04:45:56.522490 - 3:28:25 - step: 8730 acc: 0 loss: 1.5361 grad: 1.46e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6026 data: 0.0794 lr: 6.14e-05 mem: 47% pow: 653.921 W 0: INFO 26-04-29 04:46:10.017738 - 3:28:38 - step: 8740 acc: 0 loss: 1.4367 grad: 1.59e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6211 data: 0.0734 lr: 6.14e-05 mem: 47% pow: 656.238 W 0: INFO 26-04-29 04:46:24.479012 - 3:28:53 - step: 8750 acc: 0 loss: 1.5621 grad: 1.52e-01 flops: 3.91e+14 wps: 4.53e+04 iter: 0.6104 data: 0.0701 lr: 6.14e-05 mem: 47% pow: 666.089 W 0: INFO 26-04-29 04:46:38.167149 - 3:29:06 - step: 8760 acc: 0 loss: 1.4625 grad: 1.49e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6535 data: 0.0693 lr: 6.14e-05 mem: 47% pow: 628.245 W 0: INFO 26-04-29 04:46:51.721670 - 3:29:20 - step: 8770 acc: 0 loss: 1.232 grad: 1.56e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6047 data: 0.0735 lr: 6.14e-05 mem: 47% pow: 654.802 W 0: INFO 26-04-29 04:47:05.406534 - 3:29:33 - step: 8780 acc: 0 loss: 1.5639 grad: 1.50e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.611 data: 0.0612 lr: 6.13e-05 mem: 47% pow: 656.878 W 0: INFO 26-04-29 04:47:19.422240 - 3:29:48 - step: 8790 acc: 0 loss: 1.5223 grad: 1.65e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.629 data: 0.0731 lr: 6.13e-05 mem: 47% pow: 643.657 W 0: INFO 26-04-29 04:47:33.258469 - 3:30:01 - step: 8800 acc: 0 loss: 1.4683 grad: 1.45e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.645 data: 0.0682 lr: 6.13e-05 mem: 47% pow: 635.727 W 0: INFO 26-04-29 04:47:49.830364 - 3:30:18 - step: 8810 acc: 0 loss: 1.4499 grad: 1.48e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6028 data: 0.0781 lr: 6.13e-05 mem: 54% pow: 649.105 W 0: INFO 26-04-29 04:48:03.706252 - 3:30:32 - step: 8820 acc: 0 loss: 1.5373 grad: 1.65e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6415 data: 0.0693 lr: 6.13e-05 mem: 47% pow: 649.896 W 0: INFO 26-04-29 04:48:17.293278 - 3:30:45 - step: 8830 acc: 0 loss: 1.5744 grad: 1.63e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6658 data: 0.0462 lr: 6.13e-05 mem: 47% pow: 650.55 W 0: INFO 26-04-29 04:48:30.910826 - 3:30:59 - step: 8840 acc: 0 loss: 1.3162 grad: 1.59e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6404 data: 0.072 lr: 6.12e-05 mem: 47% pow: 632.539 W 0: INFO 26-04-29 04:48:44.395767 - 3:31:12 - step: 8850 acc: 0 loss: 1.4385 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6079 data: 0.0631 lr: 6.12e-05 mem: 47% pow: 671.859 W 0: INFO 26-04-29 04:48:57.953643 - 3:31:26 - step: 8860 acc: 0 loss: 1.2677 grad: 1.53e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6136 data: 0.0768 lr: 6.12e-05 mem: 47% pow: 652.762 W 0: INFO 26-04-29 04:49:11.514882 - 3:31:40 - step: 8870 acc: 0 loss: 1.5552 grad: 1.50e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.683 data: 0.0707 lr: 6.12e-05 mem: 47% pow: 612.652 W 0: INFO 26-04-29 04:49:25.127039 - 3:31:53 - step: 8880 acc: 0 loss: 1.3542 grad: 1.56e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.612 data: 0.0678 lr: 6.12e-05 mem: 47% pow: 658.502 W 0: INFO 26-04-29 04:49:38.908093 - 3:32:07 - step: 8890 acc: 0 loss: 1.6007 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6177 data: 0.072 lr: 6.12e-05 mem: 47% pow: 657.543 W 0: INFO 26-04-29 04:49:52.601490 - 3:32:21 - step: 8900 acc: 0 loss: 1.6162 grad: 1.51e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6129 data: 0.0683 lr: 6.12e-05 mem: 47% pow: 654.575 W 0: INFO 26-04-29 04:50:09.262780 - 3:32:37 - step: 8910 acc: 0 loss: 1.5946 grad: 1.54e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.607 data: 0.0733 lr: 6.11e-05 mem: 54% pow: 653.081 W 0: INFO 26-04-29 04:50:22.891929 - 3:32:51 - step: 8920 acc: 0 loss: 1.6693 grad: 1.50e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6123 data: 0.0669 lr: 6.11e-05 mem: 47% pow: 688.101 W 0: INFO 26-04-29 04:50:36.340994 - 3:33:04 - step: 8930 acc: 0 loss: 1.3116 grad: 1.65e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6152 data: 0.0751 lr: 6.11e-05 mem: 47% pow: 657.961 W 0: INFO 26-04-29 04:50:50.002580 - 3:33:18 - step: 8940 acc: 0 loss: 1.6551 grad: 1.62e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6029 data: 0.074 lr: 6.11e-05 mem: 47% pow: 656.116 W 0: INFO 26-04-29 04:51:03.723967 - 3:33:32 - step: 8950 acc: 0 loss: 1.5696 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6448 data: 0.0717 lr: 6.11e-05 mem: 47% pow: 644.625 W 0: INFO 26-04-29 04:51:17.489343 - 3:33:46 - step: 8960 acc: 0 loss: 1.5054 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6334 data: 0.0703 lr: 6.11e-05 mem: 47% pow: 639.827 W 0: INFO 26-04-29 04:51:31.187013 - 3:33:59 - step: 8970 acc: 0 loss: 1.387 grad: 1.50e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6154 data: 0.0718 lr: 6.11e-05 mem: 47% pow: 656.243 W 0: INFO 26-04-29 04:51:44.743187 - 3:34:13 - step: 8980 acc: 0 loss: 1.7218 grad: 1.42e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6269 data: 0.071 lr: 6.10e-05 mem: 47% pow: 641.999 W 0: INFO 26-04-29 04:51:58.626724 - 3:34:27 - step: 8990 acc: 0 loss: 1.357 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6135 data: 0.071 lr: 6.10e-05 mem: 47% pow: 654.063 W 0: INFO 26-04-29 04:52:12.184263 - 3:34:40 - step: 9000 acc: 0 loss: 1.3272 grad: 1.62e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6018 data: 0.0802 lr: 6.10e-05 mem: 47% pow: 648.872 W 0: INFO 26-04-29 04:52:15.828423 - 3:34:44 - garbage collection 0: INFO 26-04-29 04:52:30.641378 - 3:34:59 - step: 9010 acc: 0 loss: 1.6601 grad: 1.48e-01 flops: 3.06e+14 wps: 3.55e+04 iter: 0.6128 data: 0.0722 lr: 6.10e-05 mem: 54% pow: 654.706 W 0: INFO 26-04-29 04:52:44.134447 - 3:35:12 - step: 9020 acc: 0 loss: 1.2194 grad: 1.49e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6152 data: 0.0744 lr: 6.10e-05 mem: 47% pow: 669.289 W 0: INFO 26-04-29 04:52:57.858336 - 3:35:26 - step: 9030 acc: 0 loss: 1.5281 grad: 1.62e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5913 data: 0.0821 lr: 6.10e-05 mem: 47% pow: 669.283 W 0: INFO 26-04-29 04:53:11.601736 - 3:35:40 - step: 9040 acc: 0 loss: 1.3913 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7031 data: 0.0727 lr: 6.09e-05 mem: 47% pow: 610.878 W 0: INFO 26-04-29 04:53:25.166286 - 3:35:53 - step: 9050 acc: 0 loss: 1.3984 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6276 data: 0.0783 lr: 6.09e-05 mem: 47% pow: 639.198 W 0: INFO 26-04-29 04:53:38.710349 - 3:36:07 - step: 9060 acc: 0 loss: 1.3051 grad: 1.44e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5938 data: 0.0878 lr: 6.09e-05 mem: 47% pow: 672.34 W 0: INFO 26-04-29 04:53:52.570674 - 3:36:21 - step: 9070 acc: 0 loss: 1.5179 grad: 1.49e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6363 data: 0.0773 lr: 6.09e-05 mem: 47% pow: 641.536 W 0: INFO 26-04-29 04:54:06.326113 - 3:36:34 - step: 9080 acc: 0 loss: 1.6249 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.624 data: 0.0607 lr: 6.09e-05 mem: 47% pow: 650.819 W 0: INFO 26-04-29 04:54:19.772429 - 3:36:48 - step: 9090 acc: 0 loss: 1.7211 grad: 1.41e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6324 data: 0.0532 lr: 6.09e-05 mem: 47% pow: 654.594 W 0: INFO 26-04-29 04:54:33.278273 - 3:37:01 - step: 9100 acc: 0 loss: 1.4086 grad: 1.57e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6274 data: 0.0715 lr: 6.09e-05 mem: 47% pow: 647.852 W 0: INFO 26-04-29 04:54:49.717083 - 3:37:18 - step: 9110 acc: 0 loss: 1.4629 grad: 1.55e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.6354 data: 0.0678 lr: 6.08e-05 mem: 54% pow: 654.621 W 0: INFO 26-04-29 04:55:03.668452 - 3:37:32 - step: 9120 acc: 0 loss: 1.4113 grad: 1.46e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6122 data: 0.0707 lr: 6.08e-05 mem: 47% pow: 654.862 W 0: INFO 26-04-29 04:55:17.681227 - 3:37:46 - step: 9130 acc: 0 loss: 1.3855 grad: 1.46e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6231 data: 0.0717 lr: 6.08e-05 mem: 47% pow: 651.149 W 0: INFO 26-04-29 04:55:31.673896 - 3:38:00 - step: 9140 acc: 0 loss: 1.8986 grad: 1.43e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6297 data: 0.0622 lr: 6.08e-05 mem: 47% pow: 652.345 W 0: INFO 26-04-29 04:55:45.295622 - 3:38:13 - step: 9150 acc: 0 loss: 1.5289 grad: 1.45e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6087 data: 0.0715 lr: 6.08e-05 mem: 47% pow: 653.34 W 0: INFO 26-04-29 04:55:58.857159 - 3:38:27 - step: 9160 acc: 0 loss: 1.5878 grad: 1.48e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6306 data: 0.0671 lr: 6.08e-05 mem: 47% pow: 643.601 W 0: INFO 26-04-29 04:56:12.278486 - 3:38:40 - step: 9170 acc: 0 loss: 1.8624 grad: 1.47e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6061 data: 0.0736 lr: 6.08e-05 mem: 47% pow: 653.995 W 0: INFO 26-04-29 04:56:26.053589 - 3:38:54 - step: 9180 acc: 0 loss: 1.3948 grad: 1.42e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6205 data: 0.0721 lr: 6.07e-05 mem: 47% pow: 643.984 W 0: INFO 26-04-29 04:56:39.906998 - 3:39:08 - step: 9190 acc: 0 loss: 1.7589 grad: 1.51e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6109 data: 0.0795 lr: 6.07e-05 mem: 47% pow: 655.739 W 0: INFO 26-04-29 04:56:53.553884 - 3:39:22 - step: 9200 acc: 0 loss: 1.3574 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6087 data: 0.0698 lr: 6.07e-05 mem: 47% pow: 658.039 W 0: INFO 26-04-29 04:57:10.260666 - 3:39:38 - step: 9210 acc: 0 loss: 1.4802 grad: 1.45e-01 flops: 3.38e+14 wps: 3.93e+04 iter: 0.6435 data: 0.0399 lr: 6.07e-05 mem: 54% pow: 676.053 W 0: INFO 26-04-29 04:57:24.289454 - 3:39:52 - step: 9220 acc: 0 loss: 1.4785 grad: 1.44e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6295 data: 0.0586 lr: 6.07e-05 mem: 47% pow: 663.042 W 0: INFO 26-04-29 04:57:38.305137 - 3:40:06 - step: 9230 acc: 0 loss: 1.6193 grad: 1.46e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6124 data: 0.0732 lr: 6.07e-05 mem: 47% pow: 649.222 W 0: INFO 26-04-29 04:57:51.874986 - 3:40:20 - step: 9240 acc: 0 loss: 1.5552 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6479 data: 0.0718 lr: 6.07e-05 mem: 47% pow: 631.591 W 0: INFO 26-04-29 04:58:05.769445 - 3:40:34 - step: 9250 acc: 0 loss: 1.4128 grad: 1.49e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.8582 data: 0.064 lr: 6.06e-05 mem: 47% pow: 521.753 W 0: INFO 26-04-29 04:58:19.407033 - 3:40:47 - step: 9260 acc: 0 loss: 1.2508 grad: 1.49e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.629 data: 0.0627 lr: 6.06e-05 mem: 47% pow: 660.371 W 0: INFO 26-04-29 04:58:33.471781 - 3:41:02 - step: 9270 acc: 0 loss: 1.3588 grad: 1.51e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.608 data: 0.0705 lr: 6.06e-05 mem: 47% pow: 674.0 W 0: INFO 26-04-29 04:58:47.333026 - 3:41:15 - step: 9280 acc: 0 loss: 1.4489 grad: 1.48e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6237 data: 0.0723 lr: 6.06e-05 mem: 47% pow: 647.399 W 0: INFO 26-04-29 04:59:00.896157 - 3:41:29 - step: 9290 acc: 0 loss: 1.5343 grad: 1.41e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6104 data: 0.071 lr: 6.06e-05 mem: 47% pow: 649.252 W 0: INFO 26-04-29 04:59:14.521537 - 3:41:43 - step: 9300 acc: 0 loss: 1.6609 grad: 1.40e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6483 data: 0.0691 lr: 6.06e-05 mem: 47% pow: 629.409 W 0: INFO 26-04-29 04:59:31.105129 - 3:41:59 - step: 9310 acc: 0 loss: 1.6135 grad: 1.46e-01 flops: 3.41e+14 wps: 3.95e+04 iter: 0.6102 data: 0.0725 lr: 6.05e-05 mem: 54% pow: 653.534 W 0: INFO 26-04-29 04:59:44.745917 - 3:42:13 - step: 9320 acc: 0 loss: 1.5133 grad: 1.44e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6071 data: 0.0724 lr: 6.05e-05 mem: 47% pow: 653.599 W 0: INFO 26-04-29 04:59:58.365429 - 3:42:26 - step: 9330 acc: 0 loss: 1.949 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6158 data: 0.0859 lr: 6.05e-05 mem: 47% pow: 645.25 W 0: INFO 26-04-29 05:00:12.052885 - 3:42:40 - step: 9340 acc: 0 loss: 1.4879 grad: 1.48e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6625 data: 0.0663 lr: 6.05e-05 mem: 47% pow: 636.86 W 0: INFO 26-04-29 05:00:25.684769 - 3:42:54 - step: 9350 acc: 0 loss: 1.3409 grad: 1.50e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6158 data: 0.0726 lr: 6.05e-05 mem: 47% pow: 661.041 W 0: INFO 26-04-29 05:00:39.114132 - 3:43:07 - step: 9360 acc: 0 loss: 1.5976 grad: 1.59e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6065 data: 0.0724 lr: 6.05e-05 mem: 47% pow: 655.86 W 0: INFO 26-04-29 05:00:52.869957 - 3:43:21 - step: 9370 acc: 0 loss: 1.4527 grad: 2.10e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6044 data: 0.0703 lr: 6.05e-05 mem: 47% pow: 659.434 W 0: INFO 26-04-29 05:01:06.383767 - 3:43:34 - step: 9380 acc: 0 loss: 1.4112 grad: 1.61e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6114 data: 0.0725 lr: 6.04e-05 mem: 47% pow: 664.147 W 0: INFO 26-04-29 05:01:20.191592 - 3:43:48 - step: 9390 acc: 0 loss: 1.4176 grad: 1.47e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6517 data: 0.0837 lr: 6.04e-05 mem: 47% pow: 647.937 W 0: INFO 26-04-29 05:01:33.994368 - 3:44:02 - step: 9400 acc: 0 loss: 1.3901 grad: 1.44e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.628 data: 0.059 lr: 6.04e-05 mem: 47% pow: 654.554 W 0: INFO 26-04-29 05:01:50.529011 - 3:44:19 - step: 9410 acc: 0 loss: 1.7044 grad: 1.55e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6212 data: 0.0672 lr: 6.04e-05 mem: 54% pow: 650.692 W 0: INFO 26-04-29 05:02:04.585764 - 3:44:33 - step: 9420 acc: 0 loss: 1.2401 grad: 1.71e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6128 data: 0.0766 lr: 6.04e-05 mem: 47% pow: 655.51 W 0: INFO 26-04-29 05:02:18.193794 - 3:44:46 - step: 9430 acc: 0 loss: 1.6407 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6236 data: 0.071 lr: 6.04e-05 mem: 47% pow: 649.675 W 0: INFO 26-04-29 05:02:32.142110 - 3:45:00 - step: 9440 acc: 0 loss: 1.7881 grad: 1.47e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6112 data: 0.073 lr: 6.04e-05 mem: 47% pow: 652.598 W 0: INFO 26-04-29 05:02:45.732523 - 3:45:14 - step: 9450 acc: 0 loss: 1.5957 grad: 1.51e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6091 data: 0.0685 lr: 6.03e-05 mem: 47% pow: 660.608 W 0: INFO 26-04-29 05:02:59.145298 - 3:45:27 - step: 9460 acc: 0 loss: 1.783 grad: 1.56e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6105 data: 0.0733 lr: 6.03e-05 mem: 47% pow: 654.526 W 0: INFO 26-04-29 05:03:12.942975 - 3:45:41 - step: 9470 acc: 0 loss: 1.8078 grad: 1.52e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6297 data: 0.079 lr: 6.03e-05 mem: 47% pow: 640.455 W 0: INFO 26-04-29 05:03:26.577754 - 3:45:55 - step: 9480 acc: 0 loss: 1.3634 grad: 1.80e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6134 data: 0.0694 lr: 6.03e-05 mem: 47% pow: 669.292 W 0: INFO 26-04-29 05:03:40.201009 - 3:46:08 - step: 9490 acc: 0 loss: 1.4606 grad: 1.51e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6095 data: 0.068 lr: 6.03e-05 mem: 47% pow: 658.287 W 0: INFO 26-04-29 05:03:53.870016 - 3:46:22 - step: 9500 acc: 0 loss: 1.3172 grad: 1.55e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6217 data: 0.0668 lr: 6.03e-05 mem: 47% pow: 649.967 W 0: INFO 26-04-29 05:04:10.346119 - 3:46:38 - step: 9510 acc: 0 loss: 1.7327 grad: 1.45e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5974 data: 0.0922 lr: 6.03e-05 mem: 54% pow: 657.458 W 0: INFO 26-04-29 05:04:23.976284 - 3:46:52 - step: 9520 acc: 0 loss: 1.5259 grad: 1.45e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6226 data: 0.0743 lr: 6.02e-05 mem: 47% pow: 653.985 W 0: INFO 26-04-29 05:04:37.565114 - 3:47:06 - step: 9530 acc: 0 loss: 1.3684 grad: 1.52e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6723 data: 0.0712 lr: 6.02e-05 mem: 47% pow: 618.07 W 0: INFO 26-04-29 05:04:51.032817 - 3:47:19 - step: 9540 acc: 0 loss: 1.2227 grad: 1.48e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6446 data: 0.0731 lr: 6.02e-05 mem: 47% pow: 628.562 W 0: INFO 26-04-29 05:05:04.730244 - 3:47:33 - step: 9550 acc: 0 loss: 1.6108 grad: 1.47e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6105 data: 0.0759 lr: 6.02e-05 mem: 47% pow: 658.809 W 0: INFO 26-04-29 05:05:18.298582 - 3:47:46 - step: 9560 acc: 0 loss: 1.5858 grad: 1.53e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6187 data: 0.0646 lr: 6.02e-05 mem: 47% pow: 656.029 W 0: INFO 26-04-29 05:05:31.802039 - 3:48:00 - step: 9570 acc: 0 loss: 1.4709 grad: 1.57e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6311 data: 0.0671 lr: 6.02e-05 mem: 47% pow: 655.16 W 0: INFO 26-04-29 05:05:45.621024 - 3:48:14 - step: 9580 acc: 0 loss: 1.565 grad: 1.47e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6486 data: 0.0718 lr: 6.01e-05 mem: 47% pow: 628.772 W 0: INFO 26-04-29 05:06:01.368211 - 3:48:29 - step: 9590 acc: 0 loss: 1.3166 grad: 1.50e-01 flops: 3.59e+14 wps: 4.17e+04 iter: 1.0677 data: 0.071 lr: 6.01e-05 mem: 47% pow: 442.505 W 0: INFO 26-04-29 05:06:18.087253 - 3:48:46 - step: 9600 acc: 0 loss: 1.5381 grad: 1.54e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.6557 data: 0.066 lr: 6.01e-05 mem: 47% pow: 630.075 W 0: INFO 26-04-29 05:06:34.601263 - 3:49:03 - step: 9610 acc: 0 loss: 1.5405 grad: 1.59e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6076 data: 0.0682 lr: 6.01e-05 mem: 54% pow: 658.04 W 0: INFO 26-04-29 05:06:48.562442 - 3:49:17 - step: 9620 acc: 0 loss: 1.3598 grad: 1.41e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6075 data: 0.074 lr: 6.01e-05 mem: 47% pow: 655.824 W 0: INFO 26-04-29 05:07:02.018127 - 3:49:30 - step: 9630 acc: 0 loss: 1.1477 grad: 1.47e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6068 data: 0.0751 lr: 6.01e-05 mem: 47% pow: 651.105 W 0: INFO 26-04-29 05:07:15.561696 - 3:49:44 - step: 9640 acc: 0 loss: 1.6234 grad: 1.47e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6131 data: 0.087 lr: 6.01e-05 mem: 47% pow: 637.968 W 0: INFO 26-04-29 05:07:29.049589 - 3:49:57 - step: 9650 acc: 0 loss: 1.3068 grad: 1.48e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5808 data: 0.1312 lr: 6.00e-05 mem: 47% pow: 644.091 W 0: INFO 26-04-29 05:07:42.544262 - 3:50:11 - step: 9660 acc: 0 loss: 1.3441 grad: 1.47e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6256 data: 0.0722 lr: 6.00e-05 mem: 47% pow: 658.565 W 0: INFO 26-04-29 05:07:56.361172 - 3:50:24 - step: 9670 acc: 0 loss: 1.6902 grad: 1.50e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5987 data: 0.083 lr: 6.00e-05 mem: 47% pow: 656.661 W 0: INFO 26-04-29 05:08:09.989586 - 3:50:38 - step: 9680 acc: 0 loss: 1.5067 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6101 data: 0.0818 lr: 6.00e-05 mem: 47% pow: 658.041 W 0: INFO 26-04-29 05:08:23.844175 - 3:50:52 - step: 9690 acc: 0 loss: 1.4111 grad: 1.52e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6277 data: 0.0637 lr: 6.00e-05 mem: 47% pow: 657.277 W 0: INFO 26-04-29 05:08:37.497478 - 3:51:06 - step: 9700 acc: 0 loss: 1.5221 grad: 1.40e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6627 data: 0.0656 lr: 6.00e-05 mem: 47% pow: 625.918 W 0: INFO 26-04-29 05:08:54.089263 - 3:51:22 - step: 9710 acc: 0 loss: 1.5445 grad: 1.56e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6287 data: 0.0632 lr: 6.00e-05 mem: 54% pow: 643.412 W 0: INFO 26-04-29 05:09:08.001996 - 3:51:36 - step: 9720 acc: 0 loss: 1.2763 grad: 1.55e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6121 data: 0.0717 lr: 5.99e-05 mem: 47% pow: 652.402 W 0: INFO 26-04-29 05:09:22.033681 - 3:51:50 - step: 9730 acc: 0 loss: 1.773 grad: 1.50e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6598 data: 0.0706 lr: 5.99e-05 mem: 47% pow: 629.615 W 0: INFO 26-04-29 05:09:35.786809 - 3:52:04 - step: 9740 acc: 0 loss: 1.362 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6233 data: 0.0675 lr: 5.99e-05 mem: 47% pow: 662.646 W 0: INFO 26-04-29 05:09:49.476998 - 3:52:18 - step: 9750 acc: 0 loss: 1.4793 grad: 1.42e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6186 data: 0.0709 lr: 5.99e-05 mem: 47% pow: 663.97 W 0: INFO 26-04-29 05:10:03.395078 - 3:52:31 - step: 9760 acc: 0 loss: 1.5799 grad: 1.45e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5988 data: 0.0823 lr: 5.99e-05 mem: 47% pow: 664.04 W 0: INFO 26-04-29 05:10:16.981517 - 3:52:45 - step: 9770 acc: 0 loss: 1.382 grad: 1.50e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6232 data: 0.0652 lr: 5.99e-05 mem: 47% pow: 653.788 W 0: INFO 26-04-29 05:10:30.759466 - 3:52:59 - step: 9780 acc: 0 loss: 1.4444 grad: 1.55e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6314 data: 0.0535 lr: 5.98e-05 mem: 47% pow: 655.119 W 0: INFO 26-04-29 05:10:44.430203 - 3:53:13 - step: 9790 acc: 0 loss: 1.676 grad: 1.41e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.626 data: 0.0667 lr: 5.98e-05 mem: 47% pow: 666.231 W 0: INFO 26-04-29 05:10:58.593420 - 3:53:27 - step: 9800 acc: 0 loss: 1.5802 grad: 1.45e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.8871 data: 0.0691 lr: 5.98e-05 mem: 47% pow: 499.782 W 0: INFO 26-04-29 05:11:14.995671 - 3:53:43 - step: 9810 acc: 0 loss: 1.4256 grad: 1.41e-01 flops: 3.44e+14 wps: 4.00e+04 iter: 0.6129 data: 0.0772 lr: 5.98e-05 mem: 54% pow: 653.878 W 0: INFO 26-04-29 05:11:28.707453 - 3:53:57 - step: 9820 acc: 0 loss: 1.5159 grad: 1.44e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6189 data: 0.0735 lr: 5.98e-05 mem: 47% pow: 654.223 W 0: INFO 26-04-29 05:11:42.239569 - 3:54:10 - step: 9830 acc: 0 loss: 1.5387 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6187 data: 0.0675 lr: 5.98e-05 mem: 47% pow: 645.02 W 0: INFO 26-04-29 05:11:55.843947 - 3:54:24 - step: 9840 acc: 0 loss: 1.5185 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.604 data: 0.0688 lr: 5.98e-05 mem: 47% pow: 671.11 W 0: INFO 26-04-29 05:12:09.799901 - 3:54:38 - step: 9850 acc: 0 loss: 1.7096 grad: 1.47e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6619 data: 0.0618 lr: 5.97e-05 mem: 47% pow: 631.541 W 0: INFO 26-04-29 05:12:23.597187 - 3:54:52 - step: 9860 acc: 0 loss: 1.6059 grad: 1.51e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6913 data: 0.0716 lr: 5.97e-05 mem: 47% pow: 600.781 W 0: INFO 26-04-29 05:12:37.341681 - 3:55:05 - step: 9870 acc: 0 loss: 1.4278 grad: 1.40e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6028 data: 0.085 lr: 5.97e-05 mem: 47% pow: 654.258 W 0: INFO 26-04-29 05:12:51.004896 - 3:55:19 - step: 9880 acc: 0 loss: 1.5045 grad: 1.52e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6567 data: 0.0627 lr: 5.97e-05 mem: 47% pow: 626.443 W 0: INFO 26-04-29 05:13:04.726550 - 3:55:33 - step: 9890 acc: 0 loss: 1.5515 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6248 data: 0.0768 lr: 5.97e-05 mem: 47% pow: 644.36 W 0: INFO 26-04-29 05:13:18.426669 - 3:55:47 - step: 9900 acc: 0 loss: 1.562 grad: 1.43e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6028 data: 0.0838 lr: 5.97e-05 mem: 47% pow: 660.728 W 0: INFO 26-04-29 05:13:34.797874 - 3:56:03 - step: 9910 acc: 0 loss: 1.6176 grad: 1.48e-01 flops: 3.46e+14 wps: 4.01e+04 iter: 0.6086 data: 0.0808 lr: 5.97e-05 mem: 54% pow: 659.47 W 0: INFO 26-04-29 05:13:48.357305 - 3:56:16 - step: 9920 acc: 0 loss: 1.2211 grad: 1.58e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6113 data: 0.0729 lr: 5.96e-05 mem: 47% pow: 659.639 W 0: INFO 26-04-29 05:14:02.177028 - 3:56:30 - step: 9930 acc: 0 loss: 1.3709 grad: 1.52e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6085 data: 0.0741 lr: 5.96e-05 mem: 47% pow: 655.16 W 0: INFO 26-04-29 05:14:15.717128 - 3:56:44 - step: 9940 acc: 0 loss: 1.5819 grad: 1.59e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6645 data: 0.075 lr: 5.96e-05 mem: 47% pow: 618.27 W 0: INFO 26-04-29 05:14:29.513987 - 3:56:58 - step: 9950 acc: 0 loss: 1.469 grad: 1.54e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.609 data: 0.0833 lr: 5.96e-05 mem: 47% pow: 664.5 W 0: INFO 26-04-29 05:14:43.018050 - 3:57:11 - step: 9960 acc: 0 loss: 1.6788 grad: 1.55e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6341 data: 0.0491 lr: 5.96e-05 mem: 47% pow: 654.737 W 0: INFO 26-04-29 05:14:56.968687 - 3:57:25 - step: 9970 acc: 0 loss: 1.3894 grad: 1.39e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6181 data: 0.0645 lr: 5.96e-05 mem: 47% pow: 650.188 W 0: INFO 26-04-29 05:15:10.444366 - 3:57:39 - step: 9980 acc: 0 loss: 1.5953 grad: 1.61e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6127 data: 0.0692 lr: 5.96e-05 mem: 47% pow: 653.559 W 0: INFO 26-04-29 05:15:24.362729 - 3:57:52 - step: 9990 acc: 0 loss: 1.5157 grad: 1.56e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6285 data: 0.0718 lr: 5.95e-05 mem: 47% pow: 647.3 W 0: INFO 26-04-29 05:15:37.998766 - 3:58:06 - step: 10000 acc: 0 loss: 1.554 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6421 data: 0.0734 lr: 5.95e-05 mem: 47% pow: 638.386 W 0: INFO 26-04-29 05:15:38.001403 - 3:58:06 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000010000 0: INFO 26-04-29 05:15:38.001744 - 3:58:06 - Saving... 0: INFO 26-04-29 05:15:44.111688 - 3:58:12 - State dict saved! 0: INFO 26-04-29 05:15:44.200022 - 3:58:12 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000010000/train_state_00000.json 0: INFO 26-04-29 05:15:44.203691 - 3:58:12 - Train state saved ! 0: INFO 26-04-29 05:15:44.203940 - 3:58:12 - Cleaning up checkpoints... 0: INFO 26-04-29 05:15:44.204056 - 3:58:12 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000005000'), PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000010000')] 0: INFO 26-04-29 05:15:44.204440 - 3:58:12 - Eval folders: [] 0: INFO 26-04-29 05:15:44.204558 - 3:58:12 - Other folders: [] 0: INFO 26-04-29 05:15:44.204649 - 3:58:12 - Removing folders: {PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000005000')} 0: INFO 26-04-29 05:15:48.345223 - 3:58:16 - garbage collection 0: INFO 26-04-29 05:16:02.717730 - 3:58:31 - step: 10010 acc: 0 loss: 1.6558 grad: 1.48e-01 flops: 2.29e+14 wps: 2.65e+04 iter: 0.6436 data: 0.0704 lr: 5.95e-05 mem: 54% pow: 637.971 W 0: INFO 26-04-29 05:16:16.441437 - 3:58:45 - step: 10020 acc: 0 loss: 1.3462 grad: 1.60e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7074 data: 0.0703 lr: 5.95e-05 mem: 47% pow: 593.228 W 0: INFO 26-04-29 05:16:30.134647 - 3:58:58 - step: 10030 acc: 0 loss: 1.6211 grad: 1.65e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6492 data: 0.0643 lr: 5.95e-05 mem: 47% pow: 636.289 W 0: INFO 26-04-29 05:16:44.018455 - 3:59:12 - step: 10040 acc: 0 loss: 1.8729 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6337 data: 0.0708 lr: 5.95e-05 mem: 47% pow: 641.934 W 0: INFO 26-04-29 05:16:57.518333 - 3:59:26 - step: 10050 acc: 0 loss: 1.3344 grad: 1.55e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6186 data: 0.0642 lr: 5.94e-05 mem: 47% pow: 655.521 W 0: INFO 26-04-29 05:17:11.682095 - 3:59:40 - step: 10060 acc: 0 loss: 1.4383 grad: 1.41e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6163 data: 0.0716 lr: 5.94e-05 mem: 47% pow: 659.14 W 0: INFO 26-04-29 05:17:25.313385 - 3:59:53 - step: 10070 acc: 0 loss: 1.445 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5918 data: 0.0883 lr: 5.94e-05 mem: 47% pow: 656.69 W 0: INFO 26-04-29 05:17:39.000452 - 4:00:07 - step: 10080 acc: 0 loss: 1.4842 grad: 1.48e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6197 data: 0.0663 lr: 5.94e-05 mem: 47% pow: 654.438 W 0: INFO 26-04-29 05:17:52.752412 - 4:00:21 - step: 10090 acc: 0 loss: 1.916 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.627 data: 0.0593 lr: 5.94e-05 mem: 47% pow: 651.379 W 0: INFO 26-04-29 05:18:06.574117 - 4:00:35 - step: 10100 acc: 0 loss: 1.7651 grad: 1.51e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6144 data: 0.0732 lr: 5.94e-05 mem: 47% pow: 650.158 W 0: INFO 26-04-29 05:18:23.045398 - 4:00:51 - step: 10110 acc: 0 loss: 1.4592 grad: 1.55e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.6114 data: 0.0672 lr: 5.94e-05 mem: 54% pow: 660.054 W 0: INFO 26-04-29 05:18:36.761908 - 4:01:05 - step: 10120 acc: 0 loss: 1.3321 grad: 1.70e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6138 data: 0.0666 lr: 5.93e-05 mem: 47% pow: 654.299 W 0: INFO 26-04-29 05:18:50.418901 - 4:01:19 - step: 10130 acc: 0 loss: 1.4284 grad: 1.55e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6348 data: 0.0487 lr: 5.93e-05 mem: 47% pow: 651.291 W 0: INFO 26-04-29 05:19:04.312511 - 4:01:32 - step: 10140 acc: 0 loss: 1.3373 grad: 1.52e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6512 data: 0.0647 lr: 5.93e-05 mem: 47% pow: 638.92 W 0: INFO 26-04-29 05:19:17.963648 - 4:01:46 - step: 10150 acc: 0 loss: 1.4385 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6184 data: 0.0696 lr: 5.93e-05 mem: 47% pow: 663.605 W 0: INFO 26-04-29 05:19:31.409543 - 4:01:59 - step: 10160 acc: 0 loss: 1.5557 grad: 2.01e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6093 data: 0.0608 lr: 5.93e-05 mem: 47% pow: 661.18 W 0: INFO 26-04-29 05:19:45.300013 - 4:02:13 - step: 10170 acc: 0 loss: 1.686 grad: 1.44e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6124 data: 0.071 lr: 5.93e-05 mem: 47% pow: 665.068 W 0: INFO 26-04-29 05:19:58.795089 - 4:02:27 - step: 10180 acc: 0 loss: 1.6169 grad: 1.46e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.578 data: 0.0937 lr: 5.93e-05 mem: 47% pow: 669.039 W 0: INFO 26-04-29 05:20:12.369336 - 4:02:40 - step: 10190 acc: 0 loss: 1.4625 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6015 data: 0.0844 lr: 5.92e-05 mem: 47% pow: 653.538 W 0: INFO 26-04-29 05:20:25.949582 - 4:02:54 - step: 10200 acc: 0 loss: 1.5032 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5931 data: 0.0749 lr: 5.92e-05 mem: 47% pow: 667.785 W 0: INFO 26-04-29 05:20:42.860594 - 4:03:11 - step: 10210 acc: 0 loss: 1.6507 grad: 1.49e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6328 data: 0.0663 lr: 5.92e-05 mem: 54% pow: 639.335 W 0: INFO 26-04-29 05:20:56.715098 - 4:03:25 - step: 10220 acc: 0 loss: 1.3494 grad: 1.43e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6067 data: 0.0723 lr: 5.92e-05 mem: 47% pow: 652.753 W 0: INFO 26-04-29 05:21:10.305531 - 4:03:38 - step: 10230 acc: 0 loss: 1.2526 grad: 1.59e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.669 data: 0.0756 lr: 5.92e-05 mem: 47% pow: 620.923 W 0: INFO 26-04-29 05:21:24.058055 - 4:03:52 - step: 10240 acc: 0 loss: 1.381 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6471 data: 0.0736 lr: 5.92e-05 mem: 47% pow: 629.388 W 0: INFO 26-04-29 05:21:37.901322 - 4:04:06 - step: 10250 acc: 0 loss: 1.3705 grad: 1.50e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6182 data: 0.0688 lr: 5.91e-05 mem: 47% pow: 660.355 W 0: INFO 26-04-29 05:21:51.678639 - 4:04:20 - step: 10260 acc: 0 loss: 1.778 grad: 1.50e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6229 data: 0.0788 lr: 5.91e-05 mem: 47% pow: 645.281 W 0: INFO 26-04-29 05:22:07.017184 - 4:04:35 - step: 10270 acc: 0 loss: 1.4672 grad: 1.51e-01 flops: 3.68e+14 wps: 4.27e+04 iter: 0.6261 data: 0.0731 lr: 5.91e-05 mem: 47% pow: 640.119 W 0: INFO 26-04-29 05:22:20.598268 - 4:04:49 - step: 10280 acc: 0 loss: 1.093 grad: 1.43e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6059 data: 0.07 lr: 5.91e-05 mem: 47% pow: 678.37 W 0: INFO 26-04-29 05:22:34.077092 - 4:05:02 - step: 10290 acc: 0 loss: 1.5154 grad: 1.46e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6053 data: 0.0704 lr: 5.91e-05 mem: 47% pow: 658.154 W 0: INFO 26-04-29 05:22:47.470347 - 4:05:16 - step: 10300 acc: 0 loss: 1.6867 grad: 1.44e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.5937 data: 0.0724 lr: 5.91e-05 mem: 47% pow: 664.264 W 0: INFO 26-04-29 05:23:04.000960 - 4:05:32 - step: 10310 acc: 0 loss: 1.454 grad: 1.47e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6143 data: 0.069 lr: 5.91e-05 mem: 54% pow: 652.303 W 0: INFO 26-04-29 05:23:17.499527 - 4:05:46 - step: 10320 acc: 0 loss: 1.5461 grad: 1.54e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6677 data: 0.0696 lr: 5.90e-05 mem: 47% pow: 626.14 W 0: INFO 26-04-29 05:23:31.097793 - 4:05:59 - step: 10330 acc: 0 loss: 1.6539 grad: 1.65e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6172 data: 0.0815 lr: 5.90e-05 mem: 47% pow: 638.208 W 0: INFO 26-04-29 05:23:44.725043 - 4:06:13 - step: 10340 acc: 0 loss: 1.4088 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6229 data: 0.0681 lr: 5.90e-05 mem: 47% pow: 656.023 W 0: INFO 26-04-29 05:23:58.308500 - 4:06:26 - step: 10350 acc: 0 loss: 1.6188 grad: 1.41e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.615 data: 0.0861 lr: 5.90e-05 mem: 47% pow: 662.474 W 0: INFO 26-04-29 05:24:11.835023 - 4:06:40 - step: 10360 acc: 0 loss: 1.4309 grad: 1.43e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6196 data: 0.0764 lr: 5.90e-05 mem: 47% pow: 647.45 W 0: INFO 26-04-29 05:24:25.384468 - 4:06:53 - step: 10370 acc: 0 loss: 1.5238 grad: 1.55e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6216 data: 0.0648 lr: 5.90e-05 mem: 47% pow: 657.173 W 0: INFO 26-04-29 05:24:38.961028 - 4:07:07 - step: 10380 acc: 0 loss: 1.4333 grad: 1.47e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6246 data: 0.0587 lr: 5.90e-05 mem: 47% pow: 651.828 W 0: INFO 26-04-29 05:24:52.732007 - 4:07:21 - step: 10390 acc: 0 loss: 1.4517 grad: 1.43e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6 data: 0.0669 lr: 5.89e-05 mem: 47% pow: 663.6 W 0: INFO 26-04-29 05:25:07.612789 - 4:07:36 - step: 10400 acc: 0 loss: 1.7568 grad: 1.84e-01 flops: 3.80e+14 wps: 4.40e+04 iter: 0.6305 data: 0.0468 lr: 5.89e-05 mem: 47% pow: 659.299 W 0: INFO 26-04-29 05:25:24.548236 - 4:07:53 - step: 10410 acc: 0 loss: 1.4491 grad: 1.58e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.6041 data: 0.0693 lr: 5.89e-05 mem: 54% pow: 662.939 W 0: INFO 26-04-29 05:25:38.232784 - 4:08:06 - step: 10420 acc: 0 loss: 1.4393 grad: 1.47e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6366 data: 0.069 lr: 5.89e-05 mem: 47% pow: 650.572 W 0: INFO 26-04-29 05:25:51.835971 - 4:08:20 - step: 10430 acc: 0 loss: 1.751 grad: 1.47e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6185 data: 0.074 lr: 5.89e-05 mem: 47% pow: 646.735 W 0: INFO 26-04-29 05:26:05.941358 - 4:08:34 - step: 10440 acc: 0 loss: 1.3544 grad: 1.49e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6172 data: 0.072 lr: 5.89e-05 mem: 47% pow: 654.532 W 0: INFO 26-04-29 05:26:19.850997 - 4:08:48 - step: 10450 acc: 0 loss: 1.8341 grad: 1.50e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.648 data: 0.0682 lr: 5.89e-05 mem: 47% pow: 635.817 W 0: INFO 26-04-29 05:26:33.414917 - 4:09:01 - step: 10460 acc: 0 loss: 1.1146 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6342 data: 0.076 lr: 5.88e-05 mem: 47% pow: 636.068 W 0: INFO 26-04-29 05:26:47.605221 - 4:09:16 - step: 10470 acc: 0 loss: 1.3887 grad: 1.49e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6162 data: 0.0722 lr: 5.88e-05 mem: 47% pow: 649.321 W 0: INFO 26-04-29 05:27:01.264402 - 4:09:29 - step: 10480 acc: 0 loss: 1.2182 grad: 1.43e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6541 data: 0.0465 lr: 5.88e-05 mem: 47% pow: 643.891 W 0: INFO 26-04-29 05:27:14.892567 - 4:09:43 - step: 10490 acc: 0 loss: 1.4848 grad: 1.57e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.619 data: 0.0591 lr: 5.88e-05 mem: 47% pow: 656.464 W 0: INFO 26-04-29 05:27:28.768349 - 4:09:57 - step: 10500 acc: 0 loss: 1.471 grad: 1.47e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6145 data: 0.0739 lr: 5.88e-05 mem: 47% pow: 659.356 W 0: INFO 26-04-29 05:27:45.892349 - 4:10:14 - step: 10510 acc: 0 loss: 1.669 grad: 1.62e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.6098 data: 0.0754 lr: 5.88e-05 mem: 54% pow: 660.823 W 0: INFO 26-04-29 05:27:59.779717 - 4:10:28 - step: 10520 acc: 0 loss: 1.3332 grad: 1.51e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.7885 data: 0.0707 lr: 5.87e-05 mem: 47% pow: 559.743 W 0: INFO 26-04-29 05:28:13.777036 - 4:10:42 - step: 10530 acc: 0 loss: 1.3679 grad: 1.63e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6104 data: 0.0703 lr: 5.87e-05 mem: 47% pow: 653.906 W 0: INFO 26-04-29 05:28:27.793474 - 4:10:56 - step: 10540 acc: 0 loss: 1.6814 grad: 1.47e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5988 data: 0.08 lr: 5.87e-05 mem: 47% pow: 653.062 W 0: INFO 26-04-29 05:28:41.532711 - 4:11:10 - step: 10550 acc: 0 loss: 1.6491 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6024 data: 0.0855 lr: 5.87e-05 mem: 47% pow: 663.165 W 0: INFO 26-04-29 05:28:55.501997 - 4:11:24 - step: 10560 acc: 0 loss: 1.7802 grad: 1.48e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6982 data: 0.0456 lr: 5.87e-05 mem: 47% pow: 612.089 W 0: INFO 26-04-29 05:29:09.033214 - 4:11:37 - step: 10570 acc: 0 loss: 1.9089 grad: 1.46e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6226 data: 0.0849 lr: 5.87e-05 mem: 47% pow: 646.563 W 0: INFO 26-04-29 05:29:22.730759 - 4:11:51 - step: 10580 acc: 0 loss: 1.7266 grad: 1.53e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6159 data: 0.0741 lr: 5.87e-05 mem: 47% pow: 654.999 W 0: INFO 26-04-29 05:29:36.338837 - 4:12:04 - step: 10590 acc: 0 loss: 1.4657 grad: 1.46e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6102 data: 0.0732 lr: 5.86e-05 mem: 47% pow: 651.813 W 0: INFO 26-04-29 05:29:50.150396 - 4:12:18 - step: 10600 acc: 0 loss: 1.4949 grad: 1.39e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.598 data: 0.0734 lr: 5.86e-05 mem: 47% pow: 663.524 W 0: INFO 26-04-29 05:30:07.017917 - 4:12:35 - step: 10610 acc: 0 loss: 1.2046 grad: 1.53e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.7091 data: 0.0801 lr: 5.86e-05 mem: 54% pow: 603.725 W 0: INFO 26-04-29 05:30:20.649752 - 4:12:49 - step: 10620 acc: 0 loss: 1.6164 grad: 1.47e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6173 data: 0.0729 lr: 5.86e-05 mem: 47% pow: 655.659 W 0: INFO 26-04-29 05:30:34.222959 - 4:13:02 - step: 10630 acc: 0 loss: 1.5258 grad: 1.48e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6286 data: 0.0706 lr: 5.86e-05 mem: 47% pow: 641.37 W 0: INFO 26-04-29 05:30:48.020256 - 4:13:16 - step: 10640 acc: 0 loss: 1.7681 grad: 1.56e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6314 data: 0.0772 lr: 5.86e-05 mem: 47% pow: 643.561 W 0: INFO 26-04-29 05:31:01.981450 - 4:13:30 - step: 10650 acc: 0 loss: 1.492 grad: 1.51e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7302 data: 0.0682 lr: 5.86e-05 mem: 47% pow: 592.138 W 0: INFO 26-04-29 05:31:16.022041 - 4:13:44 - step: 10660 acc: 0 loss: 1.164 grad: 1.50e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6535 data: 0.0703 lr: 5.85e-05 mem: 47% pow: 634.187 W 0: INFO 26-04-29 05:31:30.209300 - 4:13:58 - step: 10670 acc: 0 loss: 1.3729 grad: 1.51e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6454 data: 0.063 lr: 5.85e-05 mem: 47% pow: 637.867 W 0: INFO 26-04-29 05:31:44.339382 - 4:14:12 - step: 10680 acc: 0 loss: 1.3641 grad: 1.50e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6345 data: 0.0694 lr: 5.85e-05 mem: 47% pow: 641.866 W 0: INFO 26-04-29 05:31:58.477579 - 4:14:27 - step: 10690 acc: 0 loss: 1.3205 grad: 1.45e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6091 data: 0.0688 lr: 5.85e-05 mem: 47% pow: 653.544 W 0: INFO 26-04-29 05:32:12.588907 - 4:14:41 - step: 10700 acc: 0 loss: 1.4902 grad: 1.49e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6086 data: 0.0785 lr: 5.85e-05 mem: 47% pow: 656.306 W 0: INFO 26-04-29 05:32:29.864926 - 4:14:58 - step: 10710 acc: 0 loss: 1.5071 grad: 1.44e-01 flops: 3.27e+14 wps: 3.79e+04 iter: 0.7165 data: 0.0737 lr: 5.85e-05 mem: 54% pow: 600.293 W 0: INFO 26-04-29 05:32:43.944759 - 4:15:12 - step: 10720 acc: 0 loss: 1.2778 grad: 1.45e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6182 data: 0.0712 lr: 5.85e-05 mem: 47% pow: 652.815 W 0: INFO 26-04-29 05:32:57.937960 - 4:15:26 - step: 10730 acc: 0 loss: 1.6571 grad: 1.48e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6353 data: 0.0709 lr: 5.84e-05 mem: 47% pow: 657.416 W 0: INFO 26-04-29 05:33:11.601289 - 4:15:40 - step: 10740 acc: 0 loss: 1.1561 grad: 1.41e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6336 data: 0.0718 lr: 5.84e-05 mem: 47% pow: 648.799 W 0: INFO 26-04-29 05:33:25.570454 - 4:15:54 - step: 10750 acc: 0 loss: 1.3506 grad: 1.43e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6237 data: 0.0672 lr: 5.84e-05 mem: 47% pow: 649.281 W 0: INFO 26-04-29 05:33:40.165714 - 4:16:08 - step: 10760 acc: 0 loss: 1.5145 grad: 1.51e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6596 data: 0.0654 lr: 5.84e-05 mem: 47% pow: 622.706 W 0: INFO 26-04-29 05:33:54.777219 - 4:16:23 - step: 10770 acc: 0 loss: 1.376 grad: 1.58e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6121 data: 0.0692 lr: 5.84e-05 mem: 47% pow: 650.605 W 0: INFO 26-04-29 05:34:09.585585 - 4:16:38 - step: 10780 acc: 0 loss: 1.464 grad: 1.67e-01 flops: 3.81e+14 wps: 4.43e+04 iter: 0.6512 data: 0.058 lr: 5.84e-05 mem: 47% pow: 636.974 W 0: INFO 26-04-29 05:34:23.690984 - 4:16:52 - step: 10790 acc: 0 loss: 1.7015 grad: 1.52e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6324 data: 0.0706 lr: 5.83e-05 mem: 47% pow: 642.98 W 0: INFO 26-04-29 05:34:38.391186 - 4:17:06 - step: 10800 acc: 0 loss: 1.4608 grad: 1.58e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6894 data: 0.0681 lr: 5.83e-05 mem: 47% pow: 619.438 W 0: INFO 26-04-29 05:34:55.534116 - 4:17:24 - step: 10810 acc: 0 loss: 1.8467 grad: 1.48e-01 flops: 3.29e+14 wps: 3.82e+04 iter: 0.6863 data: 0.0692 lr: 5.83e-05 mem: 54% pow: 606.35 W 0: INFO 26-04-29 05:35:09.507450 - 4:17:38 - step: 10820 acc: 0 loss: 1.5875 grad: 1.45e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6163 data: 0.0688 lr: 5.83e-05 mem: 47% pow: 670.645 W 0: INFO 26-04-29 05:35:23.498674 - 4:17:52 - step: 10830 acc: 0 loss: 1.6456 grad: 1.49e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6345 data: 0.0672 lr: 5.83e-05 mem: 47% pow: 637.429 W 0: INFO 26-04-29 05:35:38.321460 - 4:18:06 - step: 10840 acc: 0 loss: 1.4064 grad: 1.45e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.7117 data: 0.0858 lr: 5.83e-05 mem: 47% pow: 586.929 W 0: INFO 26-04-29 05:35:53.588379 - 4:18:22 - step: 10850 acc: 0 loss: 2.0255 grad: 1.42e-01 flops: 3.70e+14 wps: 4.30e+04 iter: 0.6595 data: 0.0641 lr: 5.83e-05 mem: 47% pow: 631.342 W 0: INFO 26-04-29 05:36:08.138273 - 4:18:36 - step: 10860 acc: 0 loss: 1.7752 grad: 1.54e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 0.6075 data: 0.0819 lr: 5.82e-05 mem: 47% pow: 656.404 W 0: INFO 26-04-29 05:36:23.069247 - 4:18:51 - step: 10870 acc: 0 loss: 1.5225 grad: 1.50e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.8141 data: 0.073 lr: 5.82e-05 mem: 47% pow: 544.025 W 0: INFO 26-04-29 05:36:37.347222 - 4:19:05 - step: 10880 acc: 0 loss: 1.6749 grad: 1.63e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.715 data: 0.0727 lr: 5.82e-05 mem: 47% pow: 603.372 W 0: INFO 26-04-29 05:36:51.141175 - 4:19:19 - step: 10890 acc: 0 loss: 1.4359 grad: 1.47e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6083 data: 0.0754 lr: 5.82e-05 mem: 47% pow: 656.638 W 0: INFO 26-04-29 05:37:05.781223 - 4:19:34 - step: 10900 acc: 0 loss: 1.8256 grad: 1.50e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.8762 data: 0.0633 lr: 5.82e-05 mem: 47% pow: 505.943 W 0: INFO 26-04-29 05:37:23.118511 - 4:19:51 - step: 10910 acc: 0 loss: 1.7287 grad: 1.51e-01 flops: 3.26e+14 wps: 3.78e+04 iter: 0.7506 data: 0.0488 lr: 5.82e-05 mem: 54% pow: 593.041 W 0: INFO 26-04-29 05:37:37.166800 - 4:20:05 - step: 10920 acc: 0 loss: 1.4803 grad: 1.54e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6406 data: 0.0697 lr: 5.82e-05 mem: 47% pow: 639.061 W 0: INFO 26-04-29 05:37:51.442042 - 4:20:20 - step: 10930 acc: 0 loss: 1.8592 grad: 1.53e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.7317 data: 0.0524 lr: 5.81e-05 mem: 47% pow: 590.246 W 0: INFO 26-04-29 05:38:05.433153 - 4:20:34 - step: 10940 acc: 0 loss: 2.1188 grad: 1.49e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6441 data: 0.0704 lr: 5.81e-05 mem: 47% pow: 632.867 W 0: INFO 26-04-29 05:38:19.729880 - 4:20:48 - step: 10950 acc: 0 loss: 1.5866 grad: 1.57e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6679 data: 0.0727 lr: 5.81e-05 mem: 47% pow: 615.465 W 0: INFO 26-04-29 05:38:34.367581 - 4:21:02 - step: 10960 acc: 0 loss: 1.6456 grad: 1.53e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.6556 data: 0.0668 lr: 5.81e-05 mem: 47% pow: 644.186 W 0: INFO 26-04-29 05:38:49.350775 - 4:21:17 - step: 10970 acc: 0 loss: 1.405 grad: 1.48e-01 flops: 3.77e+14 wps: 4.38e+04 iter: 0.6557 data: 0.0511 lr: 5.81e-05 mem: 47% pow: 655.391 W 0: INFO 26-04-29 05:39:03.973487 - 4:21:32 - step: 10980 acc: 0 loss: 1.407 grad: 1.51e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.6965 data: 0.0711 lr: 5.81e-05 mem: 47% pow: 611.877 W 0: INFO 26-04-29 05:39:18.344369 - 4:21:46 - step: 10990 acc: 0 loss: 1.6377 grad: 1.51e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.7054 data: 0.0675 lr: 5.80e-05 mem: 47% pow: 577.731 W 0: INFO 26-04-29 05:39:35.997209 - 4:22:04 - step: 11000 acc: 0 loss: 1.4812 grad: 1.45e-01 flops: 3.20e+14 wps: 3.71e+04 iter: 0.635 data: 0.0795 lr: 5.80e-05 mem: 47% pow: 625.466 W 0: INFO 26-04-29 05:39:39.668957 - 4:22:08 - garbage collection 0: INFO 26-04-29 05:39:54.716904 - 4:22:23 - step: 11010 acc: 0 loss: 1.6249 grad: 1.46e-01 flops: 3.02e+14 wps: 3.50e+04 iter: 0.6301 data: 0.0721 lr: 5.80e-05 mem: 54% pow: 640.944 W 0: INFO 26-04-29 05:40:08.892710 - 4:22:37 - step: 11020 acc: 0 loss: 1.3847 grad: 1.59e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6038 data: 0.0681 lr: 5.80e-05 mem: 47% pow: 654.602 W 0: INFO 26-04-29 05:40:23.026830 - 4:22:51 - step: 11030 acc: 0 loss: 1.5991 grad: 1.58e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5773 data: 0.1221 lr: 5.80e-05 mem: 47% pow: 665.58 W 0: INFO 26-04-29 05:40:37.753262 - 4:23:06 - step: 11040 acc: 0 loss: 1.4577 grad: 1.45e-01 flops: 3.84e+14 wps: 4.45e+04 iter: 0.6321 data: 0.0737 lr: 5.80e-05 mem: 47% pow: 638.03 W 0: INFO 26-04-29 05:40:52.191977 - 4:23:20 - step: 11050 acc: 0 loss: 1.6446 grad: 1.52e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6364 data: 0.0796 lr: 5.80e-05 mem: 47% pow: 634.587 W 0: INFO 26-04-29 05:41:06.395567 - 4:23:34 - step: 11060 acc: 0 loss: 1.7745 grad: 1.50e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.8251 data: 0.0466 lr: 5.79e-05 mem: 47% pow: 546.247 W 0: INFO 26-04-29 05:41:21.289890 - 4:23:49 - step: 11070 acc: 0 loss: 1.3747 grad: 1.53e-01 flops: 3.79e+14 wps: 4.40e+04 iter: 0.8978 data: 0.0582 lr: 5.79e-05 mem: 47% pow: 508.663 W 0: INFO 26-04-29 05:41:35.476661 - 4:24:04 - step: 11080 acc: 0 loss: 1.5206 grad: 1.46e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6138 data: 0.0713 lr: 5.79e-05 mem: 47% pow: 657.02 W 0: INFO 26-04-29 05:41:49.621885 - 4:24:18 - step: 11090 acc: 0 loss: 1.2579 grad: 1.60e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6619 data: 0.0783 lr: 5.79e-05 mem: 47% pow: 616.559 W 0: INFO 26-04-29 05:42:04.025782 - 4:24:32 - step: 11100 acc: 0 loss: 1.3926 grad: 1.63e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6947 data: 0.071 lr: 5.79e-05 mem: 47% pow: 612.395 W 0: INFO 26-04-29 05:42:21.387006 - 4:24:49 - step: 11110 acc: 0 loss: 1.5451 grad: 1.55e-01 flops: 3.25e+14 wps: 3.78e+04 iter: 0.6357 data: 0.067 lr: 5.79e-05 mem: 54% pow: 644.15 W 0: INFO 26-04-29 05:42:35.318131 - 4:25:03 - step: 11120 acc: 0 loss: 1.6658 grad: 1.54e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.7172 data: 0.0645 lr: 5.79e-05 mem: 47% pow: 593.773 W 0: INFO 26-04-29 05:42:49.357845 - 4:25:17 - step: 11130 acc: 0 loss: 1.2984 grad: 1.48e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.8517 data: 0.0653 lr: 5.78e-05 mem: 47% pow: 518.59 W 0: INFO 26-04-29 05:43:03.492950 - 4:25:32 - step: 11140 acc: 0 loss: 1.4374 grad: 1.53e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6423 data: 0.0745 lr: 5.78e-05 mem: 47% pow: 630.088 W 0: INFO 26-04-29 05:43:17.711229 - 4:25:46 - step: 11150 acc: 0 loss: 1.5846 grad: 1.53e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.6163 data: 0.067 lr: 5.78e-05 mem: 47% pow: 653.47 W 0: INFO 26-04-29 05:43:32.568345 - 4:26:01 - step: 11160 acc: 0 loss: 1.5198 grad: 1.47e-01 flops: 3.80e+14 wps: 4.41e+04 iter: 0.6208 data: 0.071 lr: 5.78e-05 mem: 47% pow: 646.896 W 0: INFO 26-04-29 05:43:46.421374 - 4:26:15 - step: 11170 acc: 0 loss: 1.7721 grad: 1.55e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6571 data: 0.0756 lr: 5.78e-05 mem: 47% pow: 625.907 W 0: INFO 26-04-29 05:44:00.669507 - 4:26:29 - step: 11180 acc: 0 loss: 1.9092 grad: 1.43e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6499 data: 0.0728 lr: 5.78e-05 mem: 47% pow: 641.279 W 0: INFO 26-04-29 05:44:14.649462 - 4:26:43 - step: 11190 acc: 0 loss: 1.5284 grad: 1.54e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6849 data: 0.0227 lr: 5.78e-05 mem: 47% pow: 633.886 W 0: INFO 26-04-29 05:44:28.581597 - 4:26:57 - step: 11200 acc: 0 loss: 1.587 grad: 1.56e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6307 data: 0.0835 lr: 5.77e-05 mem: 47% pow: 642.794 W 0: INFO 26-04-29 05:44:45.643211 - 4:27:14 - step: 11210 acc: 0 loss: 1.6587 grad: 1.50e-01 flops: 3.31e+14 wps: 3.84e+04 iter: 0.8072 data: 0.0606 lr: 5.77e-05 mem: 54% pow: 549.221 W 0: INFO 26-04-29 05:45:00.045781 - 4:27:28 - step: 11220 acc: 0 loss: 1.591 grad: 1.50e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6164 data: 0.0659 lr: 5.77e-05 mem: 47% pow: 652.487 W 0: INFO 26-04-29 05:45:14.472210 - 4:27:43 - step: 11230 acc: 0 loss: 1.6771 grad: 1.60e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.5789 data: 0.218 lr: 5.77e-05 mem: 47% pow: 581.989 W 0: INFO 26-04-29 05:45:28.689286 - 4:27:57 - step: 11240 acc: 0 loss: 1.6609 grad: 1.63e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6584 data: 0.0662 lr: 5.77e-05 mem: 47% pow: 617.452 W 0: INFO 26-04-29 05:45:43.382303 - 4:28:11 - step: 11250 acc: 0 loss: 1.7774 grad: 1.54e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.5785 data: 0.1942 lr: 5.77e-05 mem: 47% pow: 600.067 W 0: INFO 26-04-29 05:45:57.514313 - 4:28:26 - step: 11260 acc: 0 loss: 1.6236 grad: 1.55e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6155 data: 0.0743 lr: 5.76e-05 mem: 47% pow: 643.821 W 0: INFO 26-04-29 05:46:12.260417 - 4:28:40 - step: 11270 acc: 0 loss: 1.6653 grad: 1.59e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.6267 data: 0.077 lr: 5.76e-05 mem: 47% pow: 639.421 W 0: INFO 26-04-29 05:46:26.840966 - 4:28:55 - step: 11280 acc: 0 loss: 1.9499 grad: 1.59e-01 flops: 3.87e+14 wps: 4.50e+04 iter: 0.8165 data: 0.0674 lr: 5.76e-05 mem: 47% pow: 540.667 W 0: INFO 26-04-29 05:46:41.094006 - 4:29:09 - step: 11290 acc: 0 loss: 1.4911 grad: 1.66e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.5876 data: 0.0858 lr: 5.76e-05 mem: 47% pow: 667.776 W 0: INFO 26-04-29 05:46:55.750518 - 4:29:24 - step: 11300 acc: 0 loss: 1.6865 grad: 1.54e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.7065 data: 0.0651 lr: 5.76e-05 mem: 47% pow: 605.707 W 0: INFO 26-04-29 05:47:13.051995 - 4:29:41 - step: 11310 acc: 0 loss: 1.8535 grad: 1.58e-01 flops: 3.26e+14 wps: 3.79e+04 iter: 0.657 data: 0.0733 lr: 5.76e-05 mem: 54% pow: 623.111 W 0: INFO 26-04-29 05:47:27.404793 - 4:29:55 - step: 11320 acc: 0 loss: 1.6795 grad: 1.62e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6497 data: 0.073 lr: 5.76e-05 mem: 47% pow: 645.072 W 0: INFO 26-04-29 05:47:41.655059 - 4:30:10 - step: 11330 acc: 0 loss: 1.8171 grad: 1.58e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6196 data: 0.0594 lr: 5.75e-05 mem: 47% pow: 656.79 W 0: INFO 26-04-29 05:47:55.813742 - 4:30:24 - step: 11340 acc: 0 loss: 1.655 grad: 1.59e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6338 data: 0.0596 lr: 5.75e-05 mem: 47% pow: 656.598 W 0: INFO 26-04-29 05:48:10.056306 - 4:30:38 - step: 11350 acc: 0 loss: 1.7418 grad: 1.61e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6925 data: 0.0681 lr: 5.75e-05 mem: 47% pow: 607.866 W 0: INFO 26-04-29 05:48:24.569190 - 4:30:53 - step: 11360 acc: 0 loss: 1.968 grad: 1.73e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.6136 data: 0.0741 lr: 5.75e-05 mem: 47% pow: 661.336 W 0: INFO 26-04-29 05:48:38.530335 - 4:31:07 - step: 11370 acc: 0 loss: 2.0647 grad: 4.38e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6916 data: 0.0593 lr: 5.75e-05 mem: 47% pow: 614.606 W 0: INFO 26-04-29 05:48:52.327501 - 4:31:20 - step: 11380 acc: 0 loss: 1.775 grad: 1.65e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6324 data: 0.0588 lr: 5.75e-05 mem: 47% pow: 651.026 W 0: INFO 26-04-29 05:49:07.530502 - 4:31:36 - step: 11390 acc: 0 loss: 1.9086 grad: 1.56e-01 flops: 3.71e+14 wps: 4.31e+04 iter: 0.8763 data: 0.0774 lr: 5.75e-05 mem: 47% pow: 503.543 W 0: INFO 26-04-29 05:49:21.893966 - 4:31:50 - step: 11400 acc: 0 loss: 1.5205 grad: 1.68e-01 flops: 3.93e+14 wps: 4.57e+04 iter: 0.7059 data: 0.0444 lr: 5.74e-05 mem: 47% pow: 614.14 W 0: INFO 26-04-29 05:49:42.272367 - 4:32:10 - step: 11410 acc: 0 loss: 1.906 grad: 1.55e-01 flops: 2.93e+14 wps: 3.40e+04 iter: 1.0776 data: 0.0971 lr: 5.74e-05 mem: 54% pow: 461.019 W 0: INFO 26-04-29 05:49:57.988756 - 4:32:26 - step: 11420 acc: 0 loss: 1.6462 grad: 1.61e-01 flops: 3.59e+14 wps: 4.17e+04 iter: 0.6216 data: 0.067 lr: 5.74e-05 mem: 47% pow: 656.735 W 0: INFO 26-04-29 05:50:12.374963 - 4:32:40 - step: 11430 acc: 0 loss: 1.4785 grad: 1.57e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6369 data: 0.0611 lr: 5.74e-05 mem: 47% pow: 641.904 W 0: INFO 26-04-29 05:50:26.729249 - 4:32:55 - step: 11440 acc: 0 loss: 1.9586 grad: 1.63e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6172 data: 0.0697 lr: 5.74e-05 mem: 47% pow: 658.015 W 0: INFO 26-04-29 05:50:40.939846 - 4:33:09 - step: 11450 acc: 0 loss: 1.6611 grad: 1.54e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6283 data: 0.074 lr: 5.74e-05 mem: 47% pow: 639.268 W 0: INFO 26-04-29 05:50:54.977281 - 4:33:23 - step: 11460 acc: 0 loss: 1.3227 grad: 1.55e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6198 data: 0.0907 lr: 5.73e-05 mem: 47% pow: 645.671 W 0: INFO 26-04-29 05:51:08.833422 - 4:33:37 - step: 11470 acc: 0 loss: 1.6167 grad: 1.49e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6565 data: 0.0596 lr: 5.73e-05 mem: 47% pow: 627.333 W 0: INFO 26-04-29 05:51:22.706893 - 4:33:51 - step: 11480 acc: 0 loss: 2.0354 grad: 1.64e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6131 data: 0.0677 lr: 5.73e-05 mem: 47% pow: 656.589 W 0: INFO 26-04-29 05:51:36.960540 - 4:34:05 - step: 11490 acc: 0 loss: 1.734 grad: 1.68e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6323 data: 0.068 lr: 5.73e-05 mem: 47% pow: 634.146 W 0: INFO 26-04-29 05:51:50.844035 - 4:34:19 - step: 11500 acc: 0 loss: 1.7226 grad: 1.61e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6322 data: 0.0705 lr: 5.73e-05 mem: 47% pow: 636.47 W 0: INFO 26-04-29 05:52:07.802363 - 4:34:36 - step: 11510 acc: 0 loss: 1.6006 grad: 1.54e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.6514 data: 0.0728 lr: 5.73e-05 mem: 54% pow: 627.53 W 0: INFO 26-04-29 05:52:21.720746 - 4:34:50 - step: 11520 acc: 0 loss: 2.2631 grad: 1.59e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.674 data: 0.0683 lr: 5.73e-05 mem: 47% pow: 620.44 W 0: INFO 26-04-29 05:52:35.919421 - 4:35:04 - step: 11530 acc: 0 loss: 1.4222 grad: 1.56e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6681 data: 0.0697 lr: 5.72e-05 mem: 47% pow: 624.247 W 0: INFO 26-04-29 05:52:49.722344 - 4:35:18 - step: 11540 acc: 0 loss: 1.4675 grad: 1.59e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6068 data: 0.0789 lr: 5.72e-05 mem: 47% pow: 654.218 W 0: INFO 26-04-29 05:53:03.682854 - 4:35:32 - step: 11550 acc: 0 loss: 1.5624 grad: 1.64e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6272 data: 0.0609 lr: 5.72e-05 mem: 47% pow: 651.189 W 0: INFO 26-04-29 05:53:17.410854 - 4:35:45 - step: 11560 acc: 0 loss: 1.381 grad: 1.66e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6303 data: 0.0639 lr: 5.72e-05 mem: 47% pow: 647.4 W 0: INFO 26-04-29 05:53:30.946266 - 4:35:59 - step: 11570 acc: 0 loss: 1.6386 grad: 1.95e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.6565 data: 0.0524 lr: 5.72e-05 mem: 47% pow: 649.07 W 0: INFO 26-04-29 05:53:45.057141 - 4:36:13 - step: 11580 acc: 0 loss: 1.6285 grad: 1.72e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6111 data: 0.1186 lr: 5.72e-05 mem: 47% pow: 626.096 W 0: INFO 26-04-29 05:53:58.894198 - 4:36:27 - step: 11590 acc: 0 loss: 1.6622 grad: 1.67e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6241 data: 0.072 lr: 5.72e-05 mem: 47% pow: 651.648 W 0: INFO 26-04-29 05:54:12.595992 - 4:36:41 - step: 11600 acc: 0 loss: 1.6573 grad: 1.84e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.669 data: 0.082 lr: 5.71e-05 mem: 47% pow: 624.498 W 0: INFO 26-04-29 05:54:29.151835 - 4:36:57 - step: 11610 acc: 0 loss: 2.1939 grad: 1.55e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6219 data: 0.0732 lr: 5.71e-05 mem: 54% pow: 648.134 W 0: INFO 26-04-29 05:54:43.025349 - 4:37:11 - step: 11620 acc: 0 loss: 1.5549 grad: 1.52e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6061 data: 0.0754 lr: 5.71e-05 mem: 47% pow: 652.583 W 0: INFO 26-04-29 05:54:57.549889 - 4:37:26 - step: 11630 acc: 0 loss: 1.6471 grad: 1.70e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 0.6474 data: 0.0666 lr: 5.71e-05 mem: 47% pow: 637.488 W 0: INFO 26-04-29 05:55:11.107923 - 4:37:39 - step: 11640 acc: 0 loss: 1.3433 grad: 1.58e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6133 data: 0.0768 lr: 5.71e-05 mem: 47% pow: 655.581 W 0: INFO 26-04-29 05:55:24.678179 - 4:37:53 - step: 11650 acc: 0 loss: 1.8064 grad: 1.63e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.631 data: 0.069 lr: 5.71e-05 mem: 47% pow: 649.662 W 0: INFO 26-04-29 05:55:38.704834 - 4:38:07 - step: 11660 acc: 0 loss: 2.043 grad: 1.66e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6677 data: 0.0713 lr: 5.71e-05 mem: 47% pow: 613.742 W 0: INFO 26-04-29 05:55:52.516824 - 4:38:21 - step: 11670 acc: 0 loss: 1.7732 grad: 1.83e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6662 data: 0.0703 lr: 5.70e-05 mem: 47% pow: 620.857 W 0: INFO 26-04-29 05:56:06.153521 - 4:38:34 - step: 11680 acc: 0 loss: 1.7234 grad: 1.78e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6408 data: 0.0511 lr: 5.70e-05 mem: 47% pow: 644.824 W 0: INFO 26-04-29 05:56:21.296423 - 4:38:49 - step: 11690 acc: 0 loss: 1.751 grad: 1.67e-01 flops: 3.73e+14 wps: 4.33e+04 iter: 0.699 data: 0.0685 lr: 5.70e-05 mem: 47% pow: 598.333 W 0: INFO 26-04-29 05:56:34.864796 - 4:39:03 - step: 11700 acc: 0 loss: 1.9848 grad: 1.73e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6485 data: 0.056 lr: 5.70e-05 mem: 47% pow: 640.075 W 0: INFO 26-04-29 05:56:51.325128 - 4:39:19 - step: 11710 acc: 0 loss: 1.1062 grad: 1.52e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.635 data: 0.0713 lr: 5.70e-05 mem: 54% pow: 641.199 W 0: INFO 26-04-29 05:57:05.032602 - 4:39:33 - step: 11720 acc: 0 loss: 1.8915 grad: 1.58e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6089 data: 0.0855 lr: 5.70e-05 mem: 47% pow: 643.651 W 0: INFO 26-04-29 05:57:18.615293 - 4:39:47 - step: 11730 acc: 0 loss: 1.549 grad: 1.61e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6281 data: 0.0699 lr: 5.69e-05 mem: 47% pow: 643.088 W 0: INFO 26-04-29 05:57:32.733566 - 4:40:01 - step: 11740 acc: 0 loss: 1.8906 grad: 1.59e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6072 data: 0.0696 lr: 5.69e-05 mem: 47% pow: 652.755 W 0: INFO 26-04-29 05:57:46.616979 - 4:40:15 - step: 11750 acc: 0 loss: 1.7129 grad: 1.66e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6078 data: 0.08 lr: 5.69e-05 mem: 47% pow: 674.526 W 0: INFO 26-04-29 05:58:00.388893 - 4:40:28 - step: 11760 acc: 0 loss: 2.1928 grad: 1.66e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6131 data: 0.0704 lr: 5.69e-05 mem: 47% pow: 649.326 W 0: INFO 26-04-29 05:58:13.920699 - 4:40:42 - step: 11770 acc: 0 loss: 1.3649 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6224 data: 0.0714 lr: 5.69e-05 mem: 47% pow: 651.907 W 0: INFO 26-04-29 05:58:27.652685 - 4:40:56 - step: 11780 acc: 0 loss: 1.9496 grad: 1.61e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6222 data: 0.0618 lr: 5.69e-05 mem: 47% pow: 652.321 W 0: INFO 26-04-29 05:58:41.174696 - 4:41:09 - step: 11790 acc: 0 loss: 1.4735 grad: 1.66e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6103 data: 0.0673 lr: 5.69e-05 mem: 47% pow: 654.229 W 0: INFO 26-04-29 05:58:54.895670 - 4:41:23 - step: 11800 acc: 0 loss: 2.0775 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.622 data: 0.0717 lr: 5.68e-05 mem: 47% pow: 643.959 W 0: INFO 26-04-29 05:59:11.794440 - 4:41:40 - step: 11810 acc: 0 loss: 1.9793 grad: 1.63e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6437 data: 0.071 lr: 5.68e-05 mem: 54% pow: 637.384 W 0: INFO 26-04-29 05:59:25.452978 - 4:41:54 - step: 11820 acc: 0 loss: 1.4067 grad: 1.63e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6469 data: 0.0666 lr: 5.68e-05 mem: 47% pow: 632.648 W 0: INFO 26-04-29 05:59:39.249487 - 4:42:07 - step: 11830 acc: 0 loss: 1.4345 grad: 4.36e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5819 data: 0.0916 lr: 5.68e-05 mem: 47% pow: 659.501 W 0: INFO 26-04-29 05:59:52.980395 - 4:42:21 - step: 11840 acc: 0 loss: 1.7609 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6648 data: 0.068 lr: 5.68e-05 mem: 47% pow: 622.995 W 0: INFO 26-04-29 06:00:06.983861 - 4:42:35 - step: 11850 acc: 0 loss: 1.9182 grad: 1.66e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6112 data: 0.072 lr: 5.68e-05 mem: 47% pow: 656.608 W 0: INFO 26-04-29 06:00:20.649968 - 4:42:49 - step: 11860 acc: 0 loss: 1.8386 grad: 1.48e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6256 data: 0.0736 lr: 5.68e-05 mem: 47% pow: 646.717 W 0: INFO 26-04-29 06:00:34.275854 - 4:43:02 - step: 11870 acc: 0 loss: 1.6147 grad: 1.65e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6454 data: 0.0705 lr: 5.67e-05 mem: 47% pow: 632.893 W 0: INFO 26-04-29 06:00:47.894913 - 4:43:16 - step: 11880 acc: 0 loss: 1.7734 grad: 1.60e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6461 data: 0.0706 lr: 5.67e-05 mem: 47% pow: 635.288 W 0: INFO 26-04-29 06:01:01.904946 - 4:43:30 - step: 11890 acc: 0 loss: 1.857 grad: 1.64e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6171 data: 0.0688 lr: 5.67e-05 mem: 47% pow: 655.499 W 0: INFO 26-04-29 06:01:15.657570 - 4:43:44 - step: 11900 acc: 0 loss: 1.7097 grad: 1.75e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6342 data: 0.0462 lr: 5.67e-05 mem: 47% pow: 654.73 W 0: INFO 26-04-29 06:01:32.357087 - 4:44:00 - step: 11910 acc: 0 loss: 1.6326 grad: 1.60e-01 flops: 3.38e+14 wps: 3.93e+04 iter: 0.7057 data: 0.0738 lr: 5.67e-05 mem: 54% pow: 597.734 W 0: INFO 26-04-29 06:01:49.358031 - 4:44:17 - step: 11920 acc: 0 loss: 1.6515 grad: 1.53e-01 flops: 3.32e+14 wps: 3.86e+04 iter: 0.6066 data: 0.0701 lr: 5.67e-05 mem: 47% pow: 681.232 W 0: INFO 26-04-29 06:02:03.180986 - 4:44:31 - step: 11930 acc: 0 loss: 1.91 grad: 1.63e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6715 data: 0.0694 lr: 5.66e-05 mem: 47% pow: 620.127 W 0: INFO 26-04-29 06:02:16.933913 - 4:44:45 - step: 11940 acc: 0 loss: 1.5577 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6994 data: 0.0768 lr: 5.66e-05 mem: 47% pow: 601.716 W 0: INFO 26-04-29 06:02:30.635699 - 4:44:59 - step: 11950 acc: 0 loss: 1.5822 grad: 1.67e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6414 data: 0.0724 lr: 5.66e-05 mem: 47% pow: 629.947 W 0: INFO 26-04-29 06:02:44.308247 - 4:45:12 - step: 11960 acc: 0 loss: 1.7539 grad: 1.57e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6179 data: 0.0716 lr: 5.66e-05 mem: 47% pow: 649.764 W 0: INFO 26-04-29 06:02:57.998864 - 4:45:26 - step: 11970 acc: 0 loss: 2.2753 grad: 1.63e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6142 data: 0.0713 lr: 5.66e-05 mem: 47% pow: 651.217 W 0: INFO 26-04-29 06:03:11.690170 - 4:45:40 - step: 11980 acc: 0 loss: 1.7342 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6608 data: 0.063 lr: 5.66e-05 mem: 47% pow: 636.832 W 0: INFO 26-04-29 06:03:26.259311 - 4:45:54 - step: 11990 acc: 0 loss: 1.6961 grad: 1.58e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6418 data: 0.0569 lr: 5.66e-05 mem: 47% pow: 636.138 W 0: INFO 26-04-29 06:03:40.196003 - 4:46:08 - step: 12000 acc: 0 loss: 1.1631 grad: 1.57e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6143 data: 0.0638 lr: 5.65e-05 mem: 47% pow: 656.293 W 0: INFO 26-04-29 06:03:43.824397 - 4:46:12 - garbage collection 0: INFO 26-04-29 06:03:58.799117 - 4:46:27 - step: 12010 acc: 0 loss: 1.6039 grad: 1.64e-01 flops: 3.04e+14 wps: 3.52e+04 iter: 0.6204 data: 0.0727 lr: 5.65e-05 mem: 54% pow: 649.701 W 0: INFO 26-04-29 06:04:12.650415 - 4:46:41 - step: 12020 acc: 0 loss: 1.7216 grad: 1.52e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6146 data: 0.0727 lr: 5.65e-05 mem: 47% pow: 643.891 W 0: INFO 26-04-29 06:04:26.349593 - 4:46:54 - step: 12030 acc: 0 loss: 1.8252 grad: 1.64e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6063 data: 0.0739 lr: 5.65e-05 mem: 47% pow: 653.785 W 0: INFO 26-04-29 06:04:40.175244 - 4:47:08 - step: 12040 acc: 0 loss: 1.4043 grad: 1.53e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.7081 data: 0.0695 lr: 5.65e-05 mem: 47% pow: 600.541 W 0: INFO 26-04-29 06:04:54.257736 - 4:47:22 - step: 12050 acc: 0 loss: 1.8567 grad: 1.53e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6471 data: 0.0728 lr: 5.65e-05 mem: 47% pow: 629.413 W 0: INFO 26-04-29 06:05:08.344785 - 4:47:36 - step: 12060 acc: 0 loss: 1.3324 grad: 1.69e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6659 data: 0.0787 lr: 5.65e-05 mem: 47% pow: 616.994 W 0: INFO 26-04-29 06:05:22.857266 - 4:47:51 - step: 12070 acc: 0 loss: 1.4338 grad: 1.62e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.6852 data: 0.0334 lr: 5.64e-05 mem: 47% pow: 626.953 W 0: INFO 26-04-29 06:05:36.540063 - 4:48:05 - step: 12080 acc: 0 loss: 1.7367 grad: 1.64e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6305 data: 0.0594 lr: 5.64e-05 mem: 47% pow: 658.236 W 0: INFO 26-04-29 06:05:50.413220 - 4:48:18 - step: 12090 acc: 0 loss: 1.7482 grad: 1.55e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6257 data: 0.0689 lr: 5.64e-05 mem: 47% pow: 649.326 W 0: INFO 26-04-29 06:06:04.805774 - 4:48:33 - step: 12100 acc: 0 loss: 1.7876 grad: 1.59e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6214 data: 0.0567 lr: 5.64e-05 mem: 47% pow: 652.71 W 0: INFO 26-04-29 06:06:22.129520 - 4:48:50 - step: 12110 acc: 0 loss: 1.9386 grad: 1.67e-01 flops: 3.26e+14 wps: 3.78e+04 iter: 0.629 data: 0.0605 lr: 5.64e-05 mem: 54% pow: 654.595 W 0: INFO 26-04-29 06:06:36.360581 - 4:49:04 - step: 12120 acc: 0 loss: 1.5057 grad: 1.48e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6873 data: 0.0709 lr: 5.64e-05 mem: 47% pow: 605.526 W 0: INFO 26-04-29 06:06:50.813960 - 4:49:19 - step: 12130 acc: 0 loss: 1.8946 grad: 1.48e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6479 data: 0.0644 lr: 5.64e-05 mem: 47% pow: 644.731 W 0: INFO 26-04-29 06:07:04.819894 - 4:49:33 - step: 12140 acc: 0 loss: 1.7228 grad: 1.51e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.613 data: 0.0761 lr: 5.63e-05 mem: 47% pow: 649.808 W 0: INFO 26-04-29 06:07:18.705363 - 4:49:47 - step: 12150 acc: 0 loss: 1.7437 grad: 1.69e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6098 data: 0.0721 lr: 5.63e-05 mem: 47% pow: 653.28 W 0: INFO 26-04-29 06:07:33.179377 - 4:50:01 - step: 12160 acc: 0 loss: 1.9587 grad: 1.59e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.686 data: 0.0639 lr: 5.63e-05 mem: 47% pow: 627.056 W 0: INFO 26-04-29 06:07:47.536242 - 4:50:16 - step: 12170 acc: 0 loss: 1.72 grad: 1.53e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.8097 data: 0.0604 lr: 5.63e-05 mem: 47% pow: 561.52 W 0: INFO 26-04-29 06:08:01.974774 - 4:50:30 - step: 12180 acc: 0 loss: 1.6118 grad: 1.65e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6851 data: 0.0711 lr: 5.63e-05 mem: 47% pow: 610.334 W 0: INFO 26-04-29 06:08:15.925309 - 4:50:44 - step: 12190 acc: 0 loss: 1.6591 grad: 1.62e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6088 data: 0.0712 lr: 5.63e-05 mem: 47% pow: 644.752 W 0: INFO 26-04-29 06:08:31.179683 - 4:50:59 - step: 12200 acc: 0 loss: 1.7434 grad: 1.53e-01 flops: 3.70e+14 wps: 4.30e+04 iter: 0.733 data: 0.0677 lr: 5.62e-05 mem: 47% pow: 580.409 W 0: INFO 26-04-29 06:08:48.590906 - 4:51:17 - step: 12210 acc: 0 loss: 1.696 grad: 1.54e-01 flops: 3.24e+14 wps: 3.77e+04 iter: 0.6014 data: 0.0833 lr: 5.62e-05 mem: 54% pow: 647.055 W 0: INFO 26-04-29 06:09:02.764828 - 4:51:31 - step: 12220 acc: 0 loss: 1.7024 grad: 1.57e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6467 data: 0.0703 lr: 5.62e-05 mem: 47% pow: 651.293 W 0: INFO 26-04-29 06:09:17.853830 - 4:51:46 - step: 12230 acc: 0 loss: 1.7369 grad: 1.59e-01 flops: 3.74e+14 wps: 4.35e+04 iter: 0.5823 data: 0.1362 lr: 5.62e-05 mem: 47% pow: 648.648 W 0: INFO 26-04-29 06:09:32.936991 - 4:52:01 - step: 12240 acc: 0 loss: 2.1422 grad: 1.56e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.627 data: 0.0677 lr: 5.62e-05 mem: 47% pow: 655.524 W 0: INFO 26-04-29 06:09:47.585996 - 4:52:16 - step: 12250 acc: 0 loss: 1.8579 grad: 1.53e-01 flops: 3.86e+14 wps: 4.47e+04 iter: 0.6931 data: 0.0721 lr: 5.62e-05 mem: 47% pow: 610.125 W 0: INFO 26-04-29 06:10:02.605739 - 4:52:31 - step: 12260 acc: 0 loss: 1.8268 grad: 1.66e-01 flops: 3.76e+14 wps: 4.37e+04 iter: 0.7125 data: 0.0557 lr: 5.62e-05 mem: 47% pow: 615.833 W 0: INFO 26-04-29 06:10:16.929642 - 4:52:45 - step: 12270 acc: 0 loss: 1.9319 grad: 1.51e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6532 data: 0.0661 lr: 5.61e-05 mem: 47% pow: 630.468 W 0: INFO 26-04-29 06:10:31.849740 - 4:53:00 - step: 12280 acc: 0 loss: 1.695 grad: 1.52e-01 flops: 3.79e+14 wps: 4.39e+04 iter: 0.6717 data: 0.0554 lr: 5.61e-05 mem: 47% pow: 629.565 W 0: INFO 26-04-29 06:10:46.702462 - 4:53:15 - step: 12290 acc: 0 loss: 2.198 grad: 1.62e-01 flops: 3.80e+14 wps: 4.41e+04 iter: 0.7316 data: 0.071 lr: 5.61e-05 mem: 47% pow: 586.578 W 0: INFO 26-04-29 06:11:01.661700 - 4:53:30 - step: 12300 acc: 0 loss: 1.5344 grad: 1.60e-01 flops: 3.78e+14 wps: 4.38e+04 iter: 0.8755 data: 0.0618 lr: 5.61e-05 mem: 47% pow: 507.719 W 0: INFO 26-04-29 06:11:19.397300 - 4:53:47 - step: 12310 acc: 0 loss: 1.6654 grad: 1.65e-01 flops: 3.19e+14 wps: 3.70e+04 iter: 0.759 data: 0.0697 lr: 5.61e-05 mem: 54% pow: 575.872 W 0: INFO 26-04-29 06:11:34.387282 - 4:54:02 - step: 12320 acc: 0 loss: 1.7177 grad: 1.54e-01 flops: 3.77e+14 wps: 4.37e+04 iter: 0.7022 data: 0.003 lr: 5.61e-05 mem: 47% pow: 644.271 W 0: INFO 26-04-29 06:11:49.276841 - 4:54:17 - step: 12330 acc: 0 loss: 2.2733 grad: 1.56e-01 flops: 3.79e+14 wps: 4.40e+04 iter: 0.8579 data: 0.0609 lr: 5.61e-05 mem: 47% pow: 518.596 W 0: INFO 26-04-29 06:12:04.049125 - 4:54:32 - step: 12340 acc: 0 loss: 1.4718 grad: 1.64e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.6223 data: 0.0838 lr: 5.60e-05 mem: 47% pow: 638.975 W 0: INFO 26-04-29 06:12:18.055986 - 4:54:46 - step: 12350 acc: 0 loss: 1.4579 grad: 1.51e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6624 data: 0.0515 lr: 5.60e-05 mem: 47% pow: 636.776 W 0: INFO 26-04-29 06:12:32.744845 - 4:55:01 - step: 12360 acc: 0 loss: 1.6766 grad: 1.56e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6549 data: 0.0685 lr: 5.60e-05 mem: 47% pow: 641.046 W 0: INFO 26-04-29 06:12:47.406175 - 4:55:15 - step: 12370 acc: 0 loss: 1.8013 grad: 1.57e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6562 data: 0.0427 lr: 5.60e-05 mem: 47% pow: 643.317 W 0: INFO 26-04-29 06:13:01.798419 - 4:55:30 - step: 12380 acc: 0 loss: 1.8219 grad: 1.57e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6097 data: 0.0668 lr: 5.60e-05 mem: 47% pow: 648.167 W 0: INFO 26-04-29 06:13:15.976995 - 4:55:44 - step: 12390 acc: 0 loss: 1.9527 grad: 1.58e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.7471 data: 0.0719 lr: 5.60e-05 mem: 47% pow: 576.545 W 0: INFO 26-04-29 06:13:30.420517 - 4:55:59 - step: 12400 acc: 0 loss: 1.2816 grad: 1.62e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6093 data: 0.0808 lr: 5.60e-05 mem: 47% pow: 650.625 W 0: INFO 26-04-29 06:13:48.021274 - 4:56:16 - step: 12410 acc: 0 loss: 2.2596 grad: 1.70e-01 flops: 3.21e+14 wps: 3.73e+04 iter: 0.6687 data: 0.064 lr: 5.59e-05 mem: 54% pow: 639.449 W 0: INFO 26-04-29 06:14:04.487075 - 4:56:33 - step: 12420 acc: 0 loss: 2.0783 grad: 1.66e-01 flops: 3.49e+14 wps: 4.05e+04 iter: 0.6138 data: 0.0726 lr: 5.59e-05 mem: 47% pow: 657.152 W 0: INFO 26-04-29 06:14:19.559372 - 4:56:48 - step: 12430 acc: 0 loss: 1.8658 grad: 1.49e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.7067 data: 0.0701 lr: 5.59e-05 mem: 47% pow: 594.86 W 0: INFO 26-04-29 06:14:34.288538 - 4:57:02 - step: 12440 acc: 0 loss: 1.772 grad: 1.57e-01 flops: 3.84e+14 wps: 4.45e+04 iter: 0.6827 data: 0.0749 lr: 5.59e-05 mem: 47% pow: 618.721 W 0: INFO 26-04-29 06:14:49.175915 - 4:57:17 - step: 12450 acc: 0 loss: 1.6898 grad: 1.59e-01 flops: 3.80e+14 wps: 4.41e+04 iter: 0.6218 data: 0.0649 lr: 5.59e-05 mem: 47% pow: 656.237 W 0: INFO 26-04-29 06:15:03.567059 - 4:57:32 - step: 12460 acc: 0 loss: 1.5958 grad: 1.52e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6236 data: 0.0727 lr: 5.59e-05 mem: 47% pow: 643.515 W 0: INFO 26-04-29 06:15:18.593136 - 4:57:47 - step: 12470 acc: 0 loss: 1.3638 grad: 1.59e-01 flops: 3.76e+14 wps: 4.36e+04 iter: 0.6589 data: 0.0635 lr: 5.58e-05 mem: 47% pow: 647.655 W 0: INFO 26-04-29 06:15:33.648902 - 4:58:02 - step: 12480 acc: 0 loss: 1.6598 grad: 1.58e-01 flops: 3.75e+14 wps: 4.36e+04 iter: 0.662 data: 0.0704 lr: 5.58e-05 mem: 47% pow: 639.646 W 0: INFO 26-04-29 06:15:48.276757 - 4:58:16 - step: 12490 acc: 0 loss: 2.2127 grad: 1.60e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.6994 data: 0.0754 lr: 5.58e-05 mem: 47% pow: 604.599 W 0: INFO 26-04-29 06:16:02.944272 - 4:58:31 - step: 12500 acc: 0 loss: 1.8345 grad: 1.59e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6481 data: 0.049 lr: 5.58e-05 mem: 47% pow: 639.34 W 0: INFO 26-04-29 06:16:20.476866 - 4:58:49 - step: 12510 acc: 0 loss: 1.772 grad: 1.55e-01 flops: 3.22e+14 wps: 3.74e+04 iter: 0.6259 data: 0.0645 lr: 5.58e-05 mem: 54% pow: 653.531 W 0: INFO 26-04-29 06:16:35.704406 - 4:59:04 - step: 12520 acc: 0 loss: 1.5795 grad: 1.54e-01 flops: 3.71e+14 wps: 4.31e+04 iter: 0.7573 data: 0.0642 lr: 5.58e-05 mem: 47% pow: 577.162 W 0: INFO 26-04-29 06:16:50.429125 - 4:59:19 - step: 12530 acc: 0 loss: 1.5161 grad: 1.63e-01 flops: 3.84e+14 wps: 4.45e+04 iter: 0.8011 data: 0.0027 lr: 5.58e-05 mem: 47% pow: 589.371 W 0: INFO 26-04-29 06:17:05.611775 - 4:59:34 - step: 12540 acc: 0 loss: 1.7611 grad: 1.64e-01 flops: 3.72e+14 wps: 4.32e+04 iter: 0.6184 data: 0.0686 lr: 5.57e-05 mem: 47% pow: 668.583 W 0: INFO 26-04-29 06:17:20.447775 - 4:59:49 - step: 12550 acc: 0 loss: 1.5206 grad: 1.50e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.8608 data: 0.0025 lr: 5.57e-05 mem: 47% pow: 546.796 W 0: INFO 26-04-29 06:17:35.230509 - 5:00:03 - step: 12560 acc: 0 loss: 1.8089 grad: 1.50e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.7199 data: 0.0713 lr: 5.57e-05 mem: 47% pow: 599.777 W 0: INFO 26-04-29 06:17:50.034576 - 5:00:18 - step: 12570 acc: 0 loss: 1.6576 grad: 1.65e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.612 data: 0.0681 lr: 5.57e-05 mem: 47% pow: 653.857 W 0: INFO 26-04-29 06:18:05.223928 - 5:00:33 - step: 12580 acc: 0 loss: 2.2784 grad: 1.56e-01 flops: 3.72e+14 wps: 4.32e+04 iter: 0.6973 data: 0.0441 lr: 5.57e-05 mem: 47% pow: 620.65 W 0: INFO 26-04-29 06:18:20.048299 - 5:00:48 - step: 12590 acc: 0 loss: 1.8533 grad: 1.50e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.6533 data: 0.0757 lr: 5.57e-05 mem: 47% pow: 629.967 W 0: INFO 26-04-29 06:18:34.660143 - 5:01:03 - step: 12600 acc: 0 loss: 1.7827 grad: 1.61e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6292 data: 0.0623 lr: 5.57e-05 mem: 47% pow: 656.549 W 0: INFO 26-04-29 06:18:52.666158 - 5:01:21 - step: 12610 acc: 0 loss: 1.4172 grad: 1.52e-01 flops: 3.14e+14 wps: 3.64e+04 iter: 0.781 data: 0.0762 lr: 5.56e-05 mem: 54% pow: 558.987 W 0: INFO 26-04-29 06:19:07.692098 - 5:01:36 - step: 12620 acc: 0 loss: 1.5332 grad: 1.53e-01 flops: 3.76e+14 wps: 4.36e+04 iter: 0.7238 data: 0.0698 lr: 5.56e-05 mem: 47% pow: 590.504 W 0: INFO 26-04-29 06:19:22.533532 - 5:01:51 - step: 12630 acc: 0 loss: 1.4837 grad: 1.56e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.8978 data: 0.0771 lr: 5.56e-05 mem: 47% pow: 484.808 W 0: INFO 26-04-29 06:19:37.377256 - 5:02:05 - step: 12640 acc: 0 loss: 2.0843 grad: 1.53e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.6736 data: 0.0814 lr: 5.56e-05 mem: 47% pow: 612.697 W 0: INFO 26-04-29 06:19:52.421330 - 5:02:21 - step: 12650 acc: 0 loss: 1.6075 grad: 1.48e-01 flops: 3.75e+14 wps: 4.36e+04 iter: 0.8172 data: 0.0448 lr: 5.56e-05 mem: 47% pow: 555.343 W 0: INFO 26-04-29 06:20:07.212301 - 5:02:35 - step: 12660 acc: 0 loss: 1.9041 grad: 1.53e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.7878 data: 0.0694 lr: 5.56e-05 mem: 47% pow: 562.076 W 0: INFO 26-04-29 06:20:21.433099 - 5:02:50 - step: 12670 acc: 0 loss: 1.7074 grad: 1.47e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6332 data: 0.0733 lr: 5.55e-05 mem: 47% pow: 645.746 W 0: INFO 26-04-29 06:20:35.740419 - 5:03:04 - step: 12680 acc: 0 loss: 1.4848 grad: 1.67e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.7819 data: 0.0743 lr: 5.55e-05 mem: 47% pow: 559.081 W 0: INFO 26-04-29 06:20:50.654587 - 5:03:19 - step: 12690 acc: 0 loss: 1.7024 grad: 1.58e-01 flops: 3.79e+14 wps: 4.40e+04 iter: 0.6904 data: 0.0027 lr: 5.55e-05 mem: 47% pow: 650.852 W 0: INFO 26-04-29 06:21:05.201897 - 5:03:33 - step: 12700 acc: 0 loss: 2.0091 grad: 1.57e-01 flops: 3.88e+14 wps: 4.51e+04 iter: 0.6286 data: 0.0629 lr: 5.55e-05 mem: 47% pow: 653.489 W 0: INFO 26-04-29 06:21:22.657584 - 5:03:51 - step: 12710 acc: 0 loss: 1.5526 grad: 1.63e-01 flops: 3.24e+14 wps: 3.75e+04 iter: 0.7561 data: 0.0604 lr: 5.55e-05 mem: 54% pow: 574.558 W 0: INFO 26-04-29 06:21:37.062689 - 5:04:05 - step: 12720 acc: 0 loss: 1.6987 grad: 1.54e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6269 data: 0.0734 lr: 5.55e-05 mem: 47% pow: 640.092 W 0: INFO 26-04-29 06:21:52.240231 - 5:04:20 - step: 12730 acc: 0 loss: 2.1451 grad: 1.63e-01 flops: 3.72e+14 wps: 4.32e+04 iter: 0.7916 data: 0.0691 lr: 5.55e-05 mem: 47% pow: 550.152 W 0: INFO 26-04-29 06:22:07.236324 - 5:04:35 - step: 12740 acc: 0 loss: 1.7502 grad: 1.56e-01 flops: 3.77e+14 wps: 4.37e+04 iter: 0.6914 data: 0.0598 lr: 5.54e-05 mem: 47% pow: 617.519 W 0: INFO 26-04-29 06:22:21.723852 - 5:04:50 - step: 12750 acc: 0 loss: 1.7666 grad: 1.53e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.6144 data: 0.0814 lr: 5.54e-05 mem: 47% pow: 657.265 W 0: INFO 26-04-29 06:22:36.417368 - 5:05:05 - step: 12760 acc: 0 loss: 2.227 grad: 1.75e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6472 data: 0.0695 lr: 5.54e-05 mem: 47% pow: 634.915 W 0: INFO 26-04-29 06:22:51.093307 - 5:05:19 - step: 12770 acc: 0 loss: 1.741 grad: 1.59e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6558 data: 0.0694 lr: 5.54e-05 mem: 47% pow: 635.475 W 0: INFO 26-04-29 06:23:05.225935 - 5:05:33 - step: 12780 acc: 0 loss: 1.6724 grad: 1.51e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6261 data: 0.0739 lr: 5.54e-05 mem: 47% pow: 640.953 W 0: INFO 26-04-29 06:23:20.060095 - 5:05:48 - step: 12790 acc: 0 loss: 1.4151 grad: 1.59e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.6765 data: 0.1528 lr: 5.54e-05 mem: 47% pow: 579.441 W 0: INFO 26-04-29 06:23:35.208682 - 5:06:03 - step: 12800 acc: 0 loss: 1.4381 grad: 1.63e-01 flops: 3.73e+14 wps: 4.33e+04 iter: 0.6742 data: 0.0716 lr: 5.54e-05 mem: 47% pow: 632.977 W 0: INFO 26-04-29 06:23:52.946808 - 5:06:21 - step: 12810 acc: 0 loss: 1.6017 grad: 1.79e-01 flops: 3.18e+14 wps: 3.70e+04 iter: 0.6375 data: 0.0621 lr: 5.53e-05 mem: 54% pow: 646.86 W 0: INFO 26-04-29 06:24:07.765224 - 5:06:36 - step: 12820 acc: 0 loss: 1.4947 grad: 1.73e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.7446 data: 0.0678 lr: 5.53e-05 mem: 47% pow: 590.458 W 0: INFO 26-04-29 06:24:22.846584 - 5:06:51 - step: 12830 acc: 0 loss: 1.5039 grad: 1.78e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.7746 data: 0.0631 lr: 5.53e-05 mem: 47% pow: 564.977 W 0: INFO 26-04-29 06:24:38.141373 - 5:07:06 - step: 12840 acc: 0 loss: 1.7901 grad: 1.60e-01 flops: 3.69e+14 wps: 4.29e+04 iter: 0.578 data: 0.204 lr: 5.53e-05 mem: 47% pow: 593.884 W 0: INFO 26-04-29 06:24:52.898840 - 5:07:21 - step: 12850 acc: 0 loss: 1.6177 grad: 1.61e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.6058 data: 0.076 lr: 5.53e-05 mem: 47% pow: 670.904 W 0: INFO 26-04-29 06:25:07.746711 - 5:07:36 - step: 12860 acc: 0 loss: 1.2065 grad: 2.05e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.856 data: 0.0026 lr: 5.53e-05 mem: 47% pow: 553.417 W 0: INFO 26-04-29 06:25:22.200303 - 5:07:50 - step: 12870 acc: 0 loss: 1.6613 grad: 1.80e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6364 data: 0.082 lr: 5.53e-05 mem: 47% pow: 632.25 W 0: INFO 26-04-29 06:25:36.815151 - 5:08:05 - step: 12880 acc: 0 loss: 1.7251 grad: 1.70e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6476 data: 0.0646 lr: 5.52e-05 mem: 47% pow: 639.509 W 0: INFO 26-04-29 06:25:51.397968 - 5:08:19 - step: 12890 acc: 0 loss: 1.5454 grad: 1.72e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.7598 data: 0.0724 lr: 5.52e-05 mem: 47% pow: 570.466 W 0: INFO 26-04-29 06:26:06.001995 - 5:08:34 - step: 12900 acc: 0 loss: 1.6899 grad: 1.58e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6362 data: 0.0659 lr: 5.52e-05 mem: 47% pow: 643.027 W 0: INFO 26-04-29 06:26:23.545576 - 5:08:52 - step: 12910 acc: 0 loss: 1.6231 grad: 1.64e-01 flops: 3.22e+14 wps: 3.74e+04 iter: 0.6557 data: 0.0722 lr: 5.52e-05 mem: 54% pow: 631.013 W 0: INFO 26-04-29 06:26:38.233373 - 5:09:06 - step: 12920 acc: 0 loss: 1.3748 grad: 1.61e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.724 data: 0.0906 lr: 5.52e-05 mem: 47% pow: 582.506 W 0: INFO 26-04-29 06:26:52.570828 - 5:09:21 - step: 12930 acc: 0 loss: 1.2781 grad: 1.67e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6275 data: 0.0798 lr: 5.52e-05 mem: 47% pow: 643.205 W 0: INFO 26-04-29 06:27:07.368648 - 5:09:35 - step: 12940 acc: 0 loss: 1.8099 grad: 1.69e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.6201 data: 0.0646 lr: 5.51e-05 mem: 47% pow: 655.306 W 0: INFO 26-04-29 06:27:22.152346 - 5:09:50 - step: 12950 acc: 0 loss: 1.4753 grad: 1.60e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.7026 data: 0.0029 lr: 5.51e-05 mem: 47% pow: 645.662 W 0: INFO 26-04-29 06:27:36.923737 - 5:10:05 - step: 12960 acc: 0 loss: 2.1724 grad: 1.62e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.6462 data: 0.0782 lr: 5.51e-05 mem: 47% pow: 632.312 W 0: INFO 26-04-29 06:27:51.704216 - 5:10:20 - step: 12970 acc: 0 loss: 2.2946 grad: 1.64e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.611 data: 0.0917 lr: 5.51e-05 mem: 47% pow: 646.416 W 0: INFO 26-04-29 06:28:06.936330 - 5:10:35 - step: 12980 acc: 0 loss: 1.4835 grad: 1.56e-01 flops: 3.71e+14 wps: 4.30e+04 iter: 0.8282 data: 0.0699 lr: 5.51e-05 mem: 47% pow: 540.748 W 0: INFO 26-04-29 06:28:21.153707 - 5:10:49 - step: 12990 acc: 0 loss: 1.5592 grad: 1.56e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6388 data: 0.0583 lr: 5.51e-05 mem: 47% pow: 641.17 W 0: INFO 26-04-29 06:28:35.716552 - 5:11:04 - step: 13000 acc: 0 loss: 1.9777 grad: 1.67e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6237 data: 0.0756 lr: 5.51e-05 mem: 47% pow: 634.87 W 0: INFO 26-04-29 06:28:39.421433 - 5:11:08 - garbage collection 0: INFO 26-04-29 06:28:54.697285 - 5:11:23 - step: 13010 acc: 0 loss: 1.9003 grad: 1.63e-01 flops: 2.98e+14 wps: 3.45e+04 iter: 0.6644 data: 0.0628 lr: 5.50e-05 mem: 54% pow: 651.591 W 0: INFO 26-04-29 06:29:09.329754 - 5:11:37 - step: 13020 acc: 0 loss: 1.5756 grad: 1.61e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.6504 data: 0.0696 lr: 5.50e-05 mem: 47% pow: 642.04 W 0: INFO 26-04-29 06:29:24.041405 - 5:11:52 - step: 13030 acc: 0 loss: 1.4228 grad: 1.56e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6113 data: 0.0733 lr: 5.50e-05 mem: 47% pow: 654.034 W 0: INFO 26-04-29 06:29:39.112394 - 5:12:07 - step: 13040 acc: 0 loss: 1.9807 grad: 1.60e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.7759 data: 0.0757 lr: 5.50e-05 mem: 47% pow: 566.566 W 0: INFO 26-04-29 06:29:53.604813 - 5:12:22 - step: 13050 acc: 0 loss: 1.6505 grad: 1.59e-01 flops: 3.90e+14 wps: 4.52e+04 iter: 0.8085 data: 0.0538 lr: 5.50e-05 mem: 47% pow: 555.441 W 0: INFO 26-04-29 06:30:08.229113 - 5:12:36 - step: 13060 acc: 0 loss: 1.463 grad: 1.56e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.632 data: 0.0652 lr: 5.50e-05 mem: 47% pow: 654.075 W 0: INFO 26-04-29 06:30:23.259230 - 5:12:51 - step: 13070 acc: 0 loss: 1.7869 grad: 1.57e-01 flops: 3.76e+14 wps: 4.36e+04 iter: 0.8375 data: 0.0654 lr: 5.50e-05 mem: 47% pow: 526.296 W 0: INFO 26-04-29 06:30:37.592729 - 5:13:06 - step: 13080 acc: 0 loss: 1.7722 grad: 1.61e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.6137 data: 0.0725 lr: 5.49e-05 mem: 47% pow: 648.9 W 0: INFO 26-04-29 06:30:52.306124 - 5:13:20 - step: 13090 acc: 0 loss: 1.7131 grad: 1.76e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6194 data: 0.0648 lr: 5.49e-05 mem: 47% pow: 665.337 W 0: INFO 26-04-29 06:31:07.304739 - 5:13:35 - step: 13100 acc: 0 loss: 1.4347 grad: 1.88e-01 flops: 3.77e+14 wps: 4.37e+04 iter: 0.7701 data: 0.0751 lr: 5.49e-05 mem: 47% pow: 564.555 W 0: INFO 26-04-29 06:31:25.112029 - 5:13:53 - step: 13110 acc: 0 loss: 1.8203 grad: 1.67e-01 flops: 3.17e+14 wps: 3.68e+04 iter: 0.6361 data: 0.0818 lr: 5.49e-05 mem: 54% pow: 638.172 W 0: INFO 26-04-29 06:31:40.089227 - 5:14:08 - step: 13120 acc: 0 loss: 1.8192 grad: 1.61e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.7621 data: 0.0667 lr: 5.49e-05 mem: 47% pow: 585.717 W 0: INFO 26-04-29 06:31:54.850091 - 5:14:23 - step: 13130 acc: 0 loss: 1.8911 grad: 1.66e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.622 data: 0.0674 lr: 5.49e-05 mem: 47% pow: 649.884 W 0: INFO 26-04-29 06:32:09.702222 - 5:14:38 - step: 13140 acc: 0 loss: 1.9857 grad: 1.49e-01 flops: 3.80e+14 wps: 4.42e+04 iter: 0.7859 data: 0.0737 lr: 5.48e-05 mem: 47% pow: 552.583 W 0: INFO 26-04-29 06:32:24.649870 - 5:14:53 - step: 13150 acc: 0 loss: 1.7393 grad: 1.62e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.6872 data: 0.0706 lr: 5.48e-05 mem: 47% pow: 629.864 W 0: INFO 26-04-29 06:32:39.634245 - 5:15:08 - step: 13160 acc: 0 loss: 2.0676 grad: 1.52e-01 flops: 3.77e+14 wps: 4.38e+04 iter: 0.7047 data: 0.052 lr: 5.48e-05 mem: 47% pow: 610.638 W 0: INFO 26-04-29 06:32:54.093274 - 5:15:22 - step: 13170 acc: 0 loss: 1.4736 grad: 1.77e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6471 data: 0.0701 lr: 5.48e-05 mem: 47% pow: 643.067 W 0: INFO 26-04-29 06:33:08.600954 - 5:15:37 - step: 13180 acc: 0 loss: 1.4441 grad: 1.60e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.6606 data: 0.0669 lr: 5.48e-05 mem: 47% pow: 633.75 W 0: INFO 26-04-29 06:33:23.250817 - 5:15:51 - step: 13190 acc: 0 loss: 1.8739 grad: 1.57e-01 flops: 3.86e+14 wps: 4.47e+04 iter: 0.7311 data: 0.0641 lr: 5.48e-05 mem: 47% pow: 590.393 W 0: INFO 26-04-29 06:33:37.716877 - 5:16:06 - step: 13200 acc: 0 loss: 1.7876 grad: 1.54e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.7481 data: 0.0713 lr: 5.48e-05 mem: 47% pow: 573.93 W 0: INFO 26-04-29 06:33:55.282725 - 5:16:23 - step: 13210 acc: 0 loss: 1.876 grad: 1.66e-01 flops: 3.21e+14 wps: 3.73e+04 iter: 0.675 data: 0.0746 lr: 5.47e-05 mem: 54% pow: 617.07 W 0: INFO 26-04-29 06:34:10.287587 - 5:16:38 - step: 13220 acc: 0 loss: 1.6103 grad: 1.54e-01 flops: 3.76e+14 wps: 4.37e+04 iter: 0.6523 data: 0.0598 lr: 5.47e-05 mem: 47% pow: 639.46 W 0: INFO 26-04-29 06:34:24.991176 - 5:16:53 - step: 13230 acc: 0 loss: 1.9871 grad: 1.60e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6125 data: 0.0803 lr: 5.47e-05 mem: 47% pow: 653.442 W 0: INFO 26-04-29 06:34:39.692704 - 5:17:08 - step: 13240 acc: 0 loss: 1.812 grad: 1.56e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.7551 data: 0.0533 lr: 5.47e-05 mem: 47% pow: 595.308 W 0: INFO 26-04-29 06:34:54.487868 - 5:17:23 - step: 13250 acc: 0 loss: 1.7146 grad: 6.81e-01 flops: 3.84e+14 wps: 4.45e+04 iter: 0.7829 data: 0.076 lr: 5.47e-05 mem: 47% pow: 552.99 W 0: INFO 26-04-29 06:35:09.667208 - 5:17:38 - step: 13260 acc: 0 loss: 1.1464 grad: 1.60e-01 flops: 3.72e+14 wps: 4.32e+04 iter: 0.9971 data: 0.0705 lr: 5.47e-05 mem: 47% pow: 454.723 W 0: INFO 26-04-29 06:35:24.817764 - 5:17:53 - step: 13270 acc: 0 loss: 1.3535 grad: 1.60e-01 flops: 3.73e+14 wps: 4.33e+04 iter: 0.6779 data: 0.0821 lr: 5.47e-05 mem: 47% pow: 613.814 W 0: INFO 26-04-29 06:35:39.402502 - 5:18:07 - step: 13280 acc: 0 loss: 1.8601 grad: 1.72e-01 flops: 3.87e+14 wps: 4.50e+04 iter: 0.5789 data: 0.1646 lr: 5.46e-05 mem: 47% pow: 614.466 W 0: INFO 26-04-29 06:35:54.039894 - 5:18:22 - step: 13290 acc: 0 loss: 2.1246 grad: 1.61e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.8942 data: 0.0025 lr: 5.46e-05 mem: 47% pow: 534.16 W 0: INFO 26-04-29 06:36:08.889768 - 5:18:37 - step: 13300 acc: 0 loss: 1.6868 grad: 1.72e-01 flops: 3.80e+14 wps: 4.41e+04 iter: 0.6276 data: 0.0816 lr: 5.46e-05 mem: 47% pow: 641.38 W 0: INFO 26-04-29 06:36:26.009465 - 5:18:54 - step: 13310 acc: 0 loss: 1.9897 grad: 1.63e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.6444 data: 0.0707 lr: 5.46e-05 mem: 54% pow: 637.967 W 0: INFO 26-04-29 06:36:40.639658 - 5:19:09 - step: 13320 acc: 0 loss: 1.8813 grad: 1.61e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.651 data: 0.0652 lr: 5.46e-05 mem: 47% pow: 643.093 W 0: INFO 26-04-29 06:36:55.116293 - 5:19:23 - step: 13330 acc: 0 loss: 1.5232 grad: 1.60e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.5796 data: 0.1038 lr: 5.46e-05 mem: 47% pow: 655.559 W 0: INFO 26-04-29 06:37:09.666208 - 5:19:38 - step: 13340 acc: 0 loss: 1.5083 grad: 1.55e-01 flops: 3.88e+14 wps: 4.51e+04 iter: 0.6747 data: 0.0669 lr: 5.46e-05 mem: 47% pow: 614.65 W 0: INFO 26-04-29 06:37:24.086556 - 5:19:52 - step: 13350 acc: 0 loss: 1.2028 grad: 1.52e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6548 data: 0.0735 lr: 5.45e-05 mem: 47% pow: 624.688 W 0: INFO 26-04-29 06:37:38.386487 - 5:20:06 - step: 13360 acc: 0 loss: 1.6548 grad: 1.62e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.605 data: 0.0872 lr: 5.45e-05 mem: 47% pow: 645.766 W 0: INFO 26-04-29 06:37:52.742879 - 5:20:21 - step: 13370 acc: 0 loss: 1.691 grad: 1.78e-01 flops: 3.93e+14 wps: 4.57e+04 iter: 0.758 data: 0.0694 lr: 5.45e-05 mem: 47% pow: 576.158 W 0: INFO 26-04-29 06:38:07.125403 - 5:20:35 - step: 13380 acc: 0 loss: 1.7011 grad: 1.61e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6292 data: 0.0722 lr: 5.45e-05 mem: 47% pow: 640.481 W 0: INFO 26-04-29 06:38:21.469127 - 5:20:50 - step: 13390 acc: 0 loss: 1.3968 grad: 1.62e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.629 data: 0.0646 lr: 5.45e-05 mem: 47% pow: 648.099 W 0: INFO 26-04-29 06:38:36.029072 - 5:21:04 - step: 13400 acc: 0 loss: 1.8836 grad: 1.62e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6294 data: 0.0631 lr: 5.45e-05 mem: 47% pow: 654.094 W 0: INFO 26-04-29 06:38:53.398913 - 5:21:21 - step: 13410 acc: 0 loss: 1.5678 grad: 1.66e-01 flops: 3.25e+14 wps: 3.77e+04 iter: 0.7409 data: 0.0643 lr: 5.44e-05 mem: 54% pow: 592.293 W 0: INFO 26-04-29 06:39:08.108441 - 5:21:36 - step: 13420 acc: 0 loss: 1.564 grad: 1.63e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.663 data: 0.0774 lr: 5.44e-05 mem: 47% pow: 615.045 W 0: INFO 26-04-29 06:39:22.635767 - 5:21:51 - step: 13430 acc: 0 loss: 1.6985 grad: 1.76e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 0.6254 data: 0.113 lr: 5.44e-05 mem: 47% pow: 621.46 W 0: INFO 26-04-29 06:39:37.346646 - 5:22:05 - step: 13440 acc: 0 loss: 1.5067 grad: 1.69e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6964 data: 0.071 lr: 5.44e-05 mem: 47% pow: 614.702 W 0: INFO 26-04-29 06:39:51.848761 - 5:22:20 - step: 13450 acc: 0 loss: 1.2614 grad: 1.72e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.7352 data: 0.0788 lr: 5.44e-05 mem: 47% pow: 575.643 W 0: INFO 26-04-29 06:40:06.417744 - 5:22:35 - step: 13460 acc: 0 loss: 1.7115 grad: 1.64e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6062 data: 0.0793 lr: 5.44e-05 mem: 47% pow: 650.347 W 0: INFO 26-04-29 06:40:21.336289 - 5:22:49 - step: 13470 acc: 0 loss: 2.1141 grad: 1.60e-01 flops: 3.79e+14 wps: 4.40e+04 iter: 0.6871 data: 0.0639 lr: 5.44e-05 mem: 47% pow: 610.944 W 0: INFO 26-04-29 06:40:36.356940 - 5:23:04 - step: 13480 acc: 0 loss: 1.638 grad: 1.66e-01 flops: 3.76e+14 wps: 4.36e+04 iter: 0.608 data: 0.0763 lr: 5.43e-05 mem: 47% pow: 653.724 W 0: INFO 26-04-29 06:40:50.924577 - 5:23:19 - step: 13490 acc: 0 loss: 2.0608 grad: 1.57e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6369 data: 0.0525 lr: 5.43e-05 mem: 47% pow: 649.236 W 0: INFO 26-04-29 06:41:05.638054 - 5:23:34 - step: 13500 acc: 0 loss: 1.8425 grad: 1.67e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6109 data: 0.0902 lr: 5.43e-05 mem: 47% pow: 642.001 W 0: INFO 26-04-29 06:41:22.920795 - 5:23:51 - step: 13510 acc: 0 loss: 1.7086 grad: 1.68e-01 flops: 3.27e+14 wps: 3.79e+04 iter: 0.673 data: 0.0668 lr: 5.43e-05 mem: 54% pow: 638.546 W 0: INFO 26-04-29 06:41:38.012941 - 5:24:06 - step: 13520 acc: 0 loss: 1.8539 grad: 1.80e-01 flops: 3.74e+14 wps: 4.34e+04 iter: 0.7447 data: 0.0714 lr: 5.43e-05 mem: 47% pow: 578.642 W 0: INFO 26-04-29 06:41:53.445683 - 5:24:22 - step: 13530 acc: 0 loss: 1.918 grad: 1.62e-01 flops: 3.66e+14 wps: 4.25e+04 iter: 0.6382 data: 0.0557 lr: 5.43e-05 mem: 47% pow: 646.366 W 0: INFO 26-04-29 06:42:07.841196 - 5:24:36 - step: 13540 acc: 0 loss: 1.8818 grad: 1.63e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6505 data: 0.0687 lr: 5.43e-05 mem: 47% pow: 629.947 W 0: INFO 26-04-29 06:42:23.119662 - 5:24:51 - step: 13550 acc: 0 loss: 1.8518 grad: 1.74e-01 flops: 3.70e+14 wps: 4.29e+04 iter: 0.6855 data: 0.0225 lr: 5.42e-05 mem: 47% pow: 638.071 W 0: INFO 26-04-29 06:42:39.048084 - 5:25:07 - step: 13560 acc: 0 loss: 1.8783 grad: 1.63e-01 flops: 3.62e+14 wps: 4.20e+04 iter: 1.2842 data: 0.078 lr: 5.42e-05 mem: 47% pow: 431.452 W 0: INFO 26-04-29 06:42:54.280423 - 5:25:22 - step: 13570 acc: 0 loss: 1.8724 grad: 1.64e-01 flops: 3.71e+14 wps: 4.30e+04 iter: 0.7035 data: 0.0658 lr: 5.42e-05 mem: 47% pow: 606.845 W 0: INFO 26-04-29 06:43:09.030219 - 5:25:37 - step: 13580 acc: 0 loss: 1.6204 grad: 1.89e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.6305 data: 0.0801 lr: 5.42e-05 mem: 47% pow: 648.635 W 0: INFO 26-04-29 06:43:27.134440 - 5:25:55 - step: 13590 acc: 0 loss: 1.7274 grad: 1.78e-01 flops: 3.12e+14 wps: 3.62e+04 iter: 0.6308 data: 0.0716 lr: 5.42e-05 mem: 47% pow: 643.269 W 0: INFO 26-04-29 06:43:41.264632 - 5:26:09 - step: 13600 acc: 0 loss: 1.5771 grad: 1.86e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6054 data: 0.0695 lr: 5.42e-05 mem: 47% pow: 656.816 W 0: INFO 26-04-29 06:43:58.980566 - 5:26:27 - step: 13610 acc: 0 loss: 1.6013 grad: 1.77e-01 flops: 3.19e+14 wps: 3.70e+04 iter: 0.6295 data: 0.0773 lr: 5.41e-05 mem: 54% pow: 651.903 W 0: INFO 26-04-29 06:44:13.674202 - 5:26:42 - step: 13620 acc: 0 loss: 1.8935 grad: 1.67e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6239 data: 0.0739 lr: 5.41e-05 mem: 47% pow: 645.571 W 0: INFO 26-04-29 06:44:28.632696 - 5:26:57 - step: 13630 acc: 0 loss: 1.4609 grad: 1.70e-01 flops: 3.78e+14 wps: 4.38e+04 iter: 0.7376 data: 0.0597 lr: 5.41e-05 mem: 47% pow: 588.262 W 0: INFO 26-04-29 06:44:43.594240 - 5:27:12 - step: 13640 acc: 0 loss: 1.9839 grad: 1.91e-01 flops: 3.78e+14 wps: 4.38e+04 iter: 0.6267 data: 0.0668 lr: 5.41e-05 mem: 47% pow: 660.209 W 0: INFO 26-04-29 06:44:58.069349 - 5:27:26 - step: 13650 acc: 0 loss: 1.5749 grad: 1.81e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.6564 data: 0.0594 lr: 5.41e-05 mem: 47% pow: 626.487 W 0: INFO 26-04-29 06:45:12.509673 - 5:27:41 - step: 13660 acc: 0 loss: 1.008 grad: 2.03e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6504 data: 0.0567 lr: 5.41e-05 mem: 47% pow: 638.919 W 0: INFO 26-04-29 06:45:26.874732 - 5:27:55 - step: 13670 acc: 0 loss: 1.5098 grad: 1.71e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6196 data: 0.0935 lr: 5.41e-05 mem: 47% pow: 631.189 W 0: INFO 26-04-29 06:45:41.271211 - 5:28:09 - step: 13680 acc: 0 loss: 1.5094 grad: 1.75e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6415 data: 0.0747 lr: 5.40e-05 mem: 47% pow: 634.064 W 0: INFO 26-04-29 06:45:55.998012 - 5:28:24 - step: 13690 acc: 0 loss: 1.528 grad: 1.73e-01 flops: 3.84e+14 wps: 4.45e+04 iter: 0.7057 data: 0.0742 lr: 5.40e-05 mem: 47% pow: 594.378 W 0: INFO 26-04-29 06:46:11.386781 - 5:28:39 - step: 13700 acc: 0 loss: 1.9921 grad: 1.69e-01 flops: 3.67e+14 wps: 4.26e+04 iter: 0.6581 data: 0.0902 lr: 5.40e-05 mem: 47% pow: 621.272 W 0: INFO 26-04-29 06:46:29.222406 - 5:28:57 - step: 13710 acc: 0 loss: 1.9095 grad: 1.63e-01 flops: 3.17e+14 wps: 3.68e+04 iter: 0.7896 data: 0.0692 lr: 5.40e-05 mem: 54% pow: 555.22 W 0: INFO 26-04-29 06:46:43.966792 - 5:29:12 - step: 13720 acc: 0 loss: 1.8652 grad: 1.65e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.6581 data: 0.0603 lr: 5.40e-05 mem: 47% pow: 618.465 W 0: INFO 26-04-29 06:46:59.012427 - 5:29:27 - step: 13730 acc: 0 loss: 1.577 grad: 1.69e-01 flops: 3.80e+14 wps: 4.41e+04 iter: 0.7356 data: 0.0544 lr: 5.40e-05 mem: 47% pow: 586.618 W 0: INFO 26-04-29 06:47:13.523535 - 5:29:42 - step: 13740 acc: 0 loss: 1.578 grad: 1.56e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.6885 data: 0.0747 lr: 5.40e-05 mem: 47% pow: 624.072 W 0: INFO 26-04-29 06:47:28.343039 - 5:29:56 - step: 13750 acc: 0 loss: 1.9848 grad: 1.64e-01 flops: 3.81e+14 wps: 4.43e+04 iter: 0.6662 data: 0.0747 lr: 5.39e-05 mem: 47% pow: 616.948 W 0: INFO 26-04-29 06:47:42.646423 - 5:30:11 - step: 13760 acc: 0 loss: 1.6515 grad: 1.62e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.7814 data: 0.0334 lr: 5.39e-05 mem: 47% pow: 582.877 W 0: INFO 26-04-29 06:47:57.501332 - 5:30:26 - step: 13770 acc: 0 loss: 1.5988 grad: 1.80e-01 flops: 3.80e+14 wps: 4.41e+04 iter: 0.7466 data: 0.0796 lr: 5.39e-05 mem: 47% pow: 573.578 W 0: INFO 26-04-29 06:48:12.280676 - 5:30:40 - step: 13780 acc: 0 loss: 1.7063 grad: 1.60e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.6059 data: 0.0839 lr: 5.39e-05 mem: 47% pow: 653.046 W 0: INFO 26-04-29 06:48:26.554661 - 5:30:55 - step: 13790 acc: 0 loss: 1.2384 grad: 1.61e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.656 data: 0.0787 lr: 5.39e-05 mem: 47% pow: 632.101 W 0: INFO 26-04-29 06:48:41.314129 - 5:31:09 - step: 13800 acc: 0 loss: 1.9858 grad: 1.72e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.6327 data: 0.0587 lr: 5.39e-05 mem: 47% pow: 647.92 W 0: INFO 26-04-29 06:49:00.212679 - 5:31:28 - step: 13810 acc: 0 loss: 1.4485 grad: 1.71e-01 flops: 2.99e+14 wps: 3.47e+04 iter: 0.6237 data: 0.0778 lr: 5.39e-05 mem: 54% pow: 637.767 W 0: INFO 26-04-29 06:49:14.851160 - 5:31:43 - step: 13820 acc: 0 loss: 2.2515 grad: 1.65e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.627 data: 0.0621 lr: 5.38e-05 mem: 47% pow: 650.051 W 0: INFO 26-04-29 06:49:29.594858 - 5:31:58 - step: 13830 acc: 0 loss: 2.0789 grad: 1.98e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.6176 data: 0.0792 lr: 5.38e-05 mem: 47% pow: 645.726 W 0: INFO 26-04-29 06:49:44.225518 - 5:32:12 - step: 13840 acc: 0 loss: 1.9936 grad: 1.76e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.6547 data: 0.068 lr: 5.38e-05 mem: 47% pow: 630.377 W 0: INFO 26-04-29 06:49:59.078500 - 5:32:27 - step: 13850 acc: 0 loss: 1.5045 grad: 1.76e-01 flops: 3.80e+14 wps: 4.41e+04 iter: 0.6513 data: 0.0516 lr: 5.38e-05 mem: 47% pow: 644.182 W 0: INFO 26-04-29 06:50:13.438392 - 5:32:42 - step: 13860 acc: 0 loss: 1.5661 grad: 1.60e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6163 data: 0.0698 lr: 5.38e-05 mem: 47% pow: 650.651 W 0: INFO 26-04-29 06:50:27.909703 - 5:32:56 - step: 13870 acc: 0 loss: 1.6888 grad: 1.61e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.6655 data: 0.0541 lr: 5.38e-05 mem: 47% pow: 626.952 W 0: INFO 26-04-29 06:50:42.265938 - 5:33:10 - step: 13880 acc: 0 loss: 1.5428 grad: 1.67e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.618 data: 0.0691 lr: 5.37e-05 mem: 47% pow: 658.79 W 0: INFO 26-04-29 06:50:57.104800 - 5:33:25 - step: 13890 acc: 0 loss: 1.8428 grad: 1.69e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.6574 data: 0.0562 lr: 5.37e-05 mem: 47% pow: 637.312 W 0: INFO 26-04-29 06:51:11.575615 - 5:33:40 - step: 13900 acc: 0 loss: 1.693 grad: 1.73e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.8362 data: 0.0709 lr: 5.37e-05 mem: 47% pow: 529.67 W 0: INFO 26-04-29 06:51:28.961215 - 5:33:57 - step: 13910 acc: 0 loss: 1.3338 grad: 1.54e-01 flops: 3.25e+14 wps: 3.77e+04 iter: 0.7103 data: 0.0564 lr: 5.37e-05 mem: 54% pow: 611.909 W 0: INFO 26-04-29 06:51:43.483678 - 5:34:12 - step: 13920 acc: 0 loss: 1.7212 grad: 1.69e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 0.6529 data: 0.0563 lr: 5.37e-05 mem: 47% pow: 638.443 W 0: INFO 26-04-29 06:51:58.482763 - 5:34:27 - step: 13930 acc: 0 loss: 1.8218 grad: 1.68e-01 flops: 3.77e+14 wps: 4.37e+04 iter: 0.9905 data: 0.0742 lr: 5.37e-05 mem: 47% pow: 449.956 W 0: INFO 26-04-29 06:52:12.933549 - 5:34:41 - step: 13940 acc: 0 loss: 1.802 grad: 1.73e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6124 data: 0.0832 lr: 5.37e-05 mem: 47% pow: 643.781 W 0: INFO 26-04-29 06:52:27.318677 - 5:34:55 - step: 13950 acc: 0 loss: 1.768 grad: 1.71e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6166 data: 0.0912 lr: 5.36e-05 mem: 47% pow: 640.898 W 0: INFO 26-04-29 06:52:41.630525 - 5:35:10 - step: 13960 acc: 0 loss: 1.7122 grad: 1.71e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6385 data: 0.0813 lr: 5.36e-05 mem: 47% pow: 625.879 W 0: INFO 26-04-29 06:52:56.702386 - 5:35:25 - step: 13970 acc: 0 loss: 1.4904 grad: 1.68e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.6324 data: 0.0932 lr: 5.36e-05 mem: 47% pow: 628.385 W 0: INFO 26-04-29 06:53:11.270991 - 5:35:39 - step: 13980 acc: 0 loss: 1.5997 grad: 1.62e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6897 data: 0.0681 lr: 5.36e-05 mem: 47% pow: 614.543 W 0: INFO 26-04-29 06:53:26.027064 - 5:35:54 - step: 13990 acc: 0 loss: 1.6879 grad: 1.70e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.6023 data: 0.0733 lr: 5.36e-05 mem: 47% pow: 657.422 W 0: INFO 26-04-29 06:53:40.312445 - 5:36:08 - step: 14000 acc: 0 loss: 2.2235 grad: 1.71e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6065 data: 0.0752 lr: 5.36e-05 mem: 47% pow: 657.577 W 0: INFO 26-04-29 06:53:43.997181 - 5:36:12 - garbage collection 0: INFO 26-04-29 06:53:59.221732 - 5:36:27 - step: 14010 acc: 0 loss: 2.299 grad: 1.59e-01 flops: 2.99e+14 wps: 3.47e+04 iter: 0.6329 data: 0.071 lr: 5.36e-05 mem: 54% pow: 649.174 W 0: INFO 26-04-29 06:54:13.882068 - 5:36:42 - step: 14020 acc: 0 loss: 1.647 grad: 1.69e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6431 data: 0.0682 lr: 5.35e-05 mem: 47% pow: 637.5 W 0: INFO 26-04-29 06:54:28.238863 - 5:36:56 - step: 14030 acc: 0 loss: 1.5792 grad: 1.63e-01 flops: 3.93e+14 wps: 4.57e+04 iter: 0.6372 data: 0.069 lr: 5.35e-05 mem: 47% pow: 639.967 W 0: INFO 26-04-29 06:54:42.472430 - 5:37:11 - step: 14040 acc: 0 loss: 1.9953 grad: 1.63e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6044 data: 0.0696 lr: 5.35e-05 mem: 47% pow: 664.791 W 0: INFO 26-04-29 06:54:56.842054 - 5:37:25 - step: 14050 acc: 0 loss: 1.7821 grad: 1.72e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6323 data: 0.0713 lr: 5.35e-05 mem: 47% pow: 641.535 W 0: INFO 26-04-29 06:55:10.887937 - 5:37:39 - step: 14060 acc: 0 loss: 1.6165 grad: 2.10e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6437 data: 0.0923 lr: 5.35e-05 mem: 47% pow: 623.169 W 0: INFO 26-04-29 06:55:24.941827 - 5:37:53 - step: 14070 acc: 0 loss: 1.983 grad: 1.72e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6595 data: 0.0631 lr: 5.35e-05 mem: 47% pow: 637.777 W 0: INFO 26-04-29 06:55:39.868161 - 5:38:08 - step: 14080 acc: 0 loss: 1.9741 grad: 1.66e-01 flops: 3.81e+14 wps: 4.43e+04 iter: 0.6403 data: 0.058 lr: 5.35e-05 mem: 47% pow: 639.966 W 0: INFO 26-04-29 06:55:55.042316 - 5:38:23 - step: 14090 acc: 0 loss: 1.9311 grad: 1.76e-01 flops: 3.73e+14 wps: 4.32e+04 iter: 0.604 data: 0.0695 lr: 5.34e-05 mem: 47% pow: 659.631 W 0: INFO 26-04-29 06:56:09.220931 - 5:38:37 - step: 14100 acc: 0 loss: 1.8941 grad: 1.66e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6502 data: 0.0683 lr: 5.34e-05 mem: 47% pow: 636.179 W 0: INFO 26-04-29 06:56:26.325849 - 5:38:54 - step: 14110 acc: 0 loss: 1.979 grad: 1.75e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.7258 data: 0.1714 lr: 5.34e-05 mem: 54% pow: 533.693 W 0: INFO 26-04-29 06:56:40.479674 - 5:39:09 - step: 14120 acc: 0 loss: 1.6981 grad: 1.62e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6265 data: 0.0594 lr: 5.34e-05 mem: 47% pow: 658.536 W 0: INFO 26-04-29 06:56:54.224102 - 5:39:22 - step: 14130 acc: 0 loss: 1.8785 grad: 1.63e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6416 data: 0.0619 lr: 5.34e-05 mem: 47% pow: 661.912 W 0: INFO 26-04-29 06:57:08.756835 - 5:39:37 - step: 14140 acc: 0 loss: 1.6654 grad: 1.65e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 0.6297 data: 0.0666 lr: 5.34e-05 mem: 47% pow: 640.824 W 0: INFO 26-04-29 06:57:23.169563 - 5:39:51 - step: 14150 acc: 0 loss: 1.8756 grad: 1.77e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.5931 data: 0.0833 lr: 5.33e-05 mem: 47% pow: 654.827 W 0: INFO 26-04-29 06:57:37.269494 - 5:40:05 - step: 14160 acc: 0 loss: 2.1367 grad: 1.63e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6254 data: 0.0706 lr: 5.33e-05 mem: 47% pow: 645.809 W 0: INFO 26-04-29 06:57:50.903305 - 5:40:19 - step: 14170 acc: 0 loss: 1.6336 grad: 1.55e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6663 data: 0.0635 lr: 5.33e-05 mem: 47% pow: 637.387 W 0: INFO 26-04-29 06:58:05.072418 - 5:40:33 - step: 14180 acc: 0 loss: 1.7667 grad: 1.68e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5776 data: 0.157 lr: 5.33e-05 mem: 47% pow: 620.775 W 0: INFO 26-04-29 06:58:19.342482 - 5:40:47 - step: 14190 acc: 0 loss: 1.6916 grad: 1.63e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6271 data: 0.0918 lr: 5.33e-05 mem: 47% pow: 627.523 W 0: INFO 26-04-29 06:58:33.677241 - 5:41:02 - step: 14200 acc: 0 loss: 1.3932 grad: 1.76e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.6632 data: 0.0704 lr: 5.33e-05 mem: 47% pow: 623.899 W 0: INFO 26-04-29 06:58:50.774292 - 5:41:19 - step: 14210 acc: 0 loss: 2.0285 grad: 1.65e-01 flops: 3.30e+14 wps: 3.84e+04 iter: 0.6241 data: 0.0658 lr: 5.33e-05 mem: 54% pow: 661.947 W 0: INFO 26-04-29 06:59:04.459702 - 5:41:33 - step: 14220 acc: 0 loss: 1.6101 grad: 1.65e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6618 data: 0.0573 lr: 5.32e-05 mem: 47% pow: 649.802 W 0: INFO 26-04-29 06:59:18.532440 - 5:41:47 - step: 14230 acc: 0 loss: 2.3826 grad: 1.71e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.635 data: 0.0559 lr: 5.32e-05 mem: 47% pow: 650.561 W 0: INFO 26-04-29 06:59:32.959131 - 5:42:01 - step: 14240 acc: 0 loss: 1.8577 grad: 1.66e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6192 data: 0.068 lr: 5.32e-05 mem: 47% pow: 656.916 W 0: INFO 26-04-29 06:59:46.995588 - 5:42:15 - step: 14250 acc: 0 loss: 1.4746 grad: 1.57e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6398 data: 0.066 lr: 5.32e-05 mem: 47% pow: 638.547 W 0: INFO 26-04-29 07:00:00.893638 - 5:42:29 - step: 14260 acc: 0 loss: 1.7264 grad: 1.59e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.5886 data: 0.0922 lr: 5.32e-05 mem: 47% pow: 653.05 W 0: INFO 26-04-29 07:00:16.044041 - 5:42:44 - step: 14270 acc: 0 loss: 1.6101 grad: 1.77e-01 flops: 3.73e+14 wps: 4.33e+04 iter: 0.7353 data: 0.0604 lr: 5.32e-05 mem: 47% pow: 588.463 W 0: INFO 26-04-29 07:00:29.941538 - 5:42:58 - step: 14280 acc: 0 loss: 1.8252 grad: 3.48e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6127 data: 0.0677 lr: 5.32e-05 mem: 47% pow: 650.311 W 0: INFO 26-04-29 07:00:43.959869 - 5:43:12 - step: 14290 acc: 0 loss: 1.8123 grad: 1.67e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6175 data: 0.0666 lr: 5.31e-05 mem: 47% pow: 648.97 W 0: INFO 26-04-29 07:00:57.808062 - 5:43:26 - step: 14300 acc: 0 loss: 1.7119 grad: 1.58e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6456 data: 0.0486 lr: 5.31e-05 mem: 47% pow: 647.873 W 0: INFO 26-04-29 07:01:14.800558 - 5:43:43 - step: 14310 acc: 0 loss: 1.6839 grad: 1.67e-01 flops: 3.32e+14 wps: 3.86e+04 iter: 0.634 data: 0.0915 lr: 5.31e-05 mem: 54% pow: 627.827 W 0: INFO 26-04-29 07:01:29.052697 - 5:43:57 - step: 14320 acc: 0 loss: 2.038 grad: 1.60e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6236 data: 0.0716 lr: 5.31e-05 mem: 47% pow: 650.378 W 0: INFO 26-04-29 07:01:43.116811 - 5:44:11 - step: 14330 acc: 0 loss: 1.6686 grad: 1.63e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6374 data: 0.0482 lr: 5.31e-05 mem: 47% pow: 653.666 W 0: INFO 26-04-29 07:01:57.743788 - 5:44:26 - step: 14340 acc: 0 loss: 2.2295 grad: 1.63e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.5992 data: 0.0723 lr: 5.31e-05 mem: 47% pow: 666.228 W 0: INFO 26-04-29 07:02:11.860790 - 5:44:40 - step: 14350 acc: 0 loss: 1.4912 grad: 1.59e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.9487 data: 0.0784 lr: 5.30e-05 mem: 47% pow: 455.153 W 0: INFO 26-04-29 07:02:25.717082 - 5:44:54 - step: 14360 acc: 0 loss: 1.763 grad: 1.81e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6208 data: 0.0655 lr: 5.30e-05 mem: 47% pow: 651.965 W 0: INFO 26-04-29 07:02:39.705778 - 5:45:08 - step: 14370 acc: 0 loss: 1.907 grad: 1.75e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6849 data: 0.0025 lr: 5.30e-05 mem: 47% pow: 652.984 W 0: INFO 26-04-29 07:02:53.772697 - 5:45:22 - step: 14380 acc: 0 loss: 1.6961 grad: 1.82e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.5992 data: 0.0923 lr: 5.30e-05 mem: 47% pow: 652.82 W 0: INFO 26-04-29 07:03:07.702191 - 5:45:36 - step: 14390 acc: 0 loss: 1.7315 grad: 1.65e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5886 data: 0.1156 lr: 5.30e-05 mem: 47% pow: 641.311 W 0: INFO 26-04-29 07:03:21.680856 - 5:45:50 - step: 14400 acc: 0 loss: 2.0952 grad: 1.58e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6783 data: 0.0704 lr: 5.30e-05 mem: 47% pow: 625.151 W 0: INFO 26-04-29 07:03:38.711788 - 5:46:07 - step: 14410 acc: 0 loss: 1.2506 grad: 1.52e-01 flops: 3.32e+14 wps: 3.85e+04 iter: 0.8621 data: 0.0719 lr: 5.30e-05 mem: 54% pow: 518.781 W 0: INFO 26-04-29 07:03:52.671311 - 5:46:21 - step: 14420 acc: 0 loss: 2.0175 grad: 1.60e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6854 data: 0.0703 lr: 5.29e-05 mem: 47% pow: 616.401 W 0: INFO 26-04-29 07:04:07.343280 - 5:46:35 - step: 14430 acc: 0 loss: 1.5688 grad: 1.61e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6784 data: 0.0726 lr: 5.29e-05 mem: 47% pow: 614.353 W 0: INFO 26-04-29 07:04:21.035706 - 5:46:49 - step: 14440 acc: 0 loss: 1.7691 grad: 1.62e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6759 data: 0.0672 lr: 5.29e-05 mem: 47% pow: 619.269 W 0: INFO 26-04-29 07:04:35.154290 - 5:47:03 - step: 14450 acc: 0 loss: 1.6174 grad: 1.57e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6236 data: 0.0542 lr: 5.29e-05 mem: 47% pow: 658.813 W 0: INFO 26-04-29 07:04:49.326897 - 5:47:17 - step: 14460 acc: 0 loss: 1.6898 grad: 1.62e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6308 data: 0.0662 lr: 5.29e-05 mem: 47% pow: 641.305 W 0: INFO 26-04-29 07:05:03.018444 - 5:47:31 - step: 14470 acc: 0 loss: 2.0375 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6178 data: 0.0636 lr: 5.29e-05 mem: 47% pow: 651.957 W 0: INFO 26-04-29 07:05:17.213677 - 5:47:45 - step: 14480 acc: 0 loss: 1.8357 grad: 1.68e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6993 data: 0.0568 lr: 5.29e-05 mem: 47% pow: 609.577 W 0: INFO 26-04-29 07:05:31.422027 - 5:48:00 - step: 14490 acc: 0 loss: 1.5431 grad: 1.60e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.6259 data: 0.0828 lr: 5.28e-05 mem: 47% pow: 631.356 W 0: INFO 26-04-29 07:05:45.479067 - 5:48:14 - step: 14500 acc: 0 loss: 1.4362 grad: 1.66e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6221 data: 0.0618 lr: 5.28e-05 mem: 47% pow: 655.325 W 0: INFO 26-04-29 07:06:02.499690 - 5:48:31 - step: 14510 acc: 0 loss: 1.6648 grad: 1.66e-01 flops: 3.32e+14 wps: 3.85e+04 iter: 0.6505 data: 0.0635 lr: 5.28e-05 mem: 54% pow: 640.69 W 0: INFO 26-04-29 07:06:16.822196 - 5:48:45 - step: 14520 acc: 0 loss: 1.874 grad: 1.52e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6969 data: 0.0678 lr: 5.28e-05 mem: 47% pow: 610.544 W 0: INFO 26-04-29 07:06:31.287263 - 5:48:59 - step: 14530 acc: 0 loss: 1.6677 grad: 1.60e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6289 data: 0.0784 lr: 5.28e-05 mem: 47% pow: 640.402 W 0: INFO 26-04-29 07:06:45.367658 - 5:49:13 - step: 14540 acc: 0 loss: 1.2118 grad: 1.54e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6101 data: 0.0652 lr: 5.28e-05 mem: 47% pow: 659.541 W 0: INFO 26-04-29 07:06:59.544329 - 5:49:28 - step: 14550 acc: 0 loss: 1.634 grad: 1.59e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6207 data: 0.0756 lr: 5.28e-05 mem: 47% pow: 654.602 W 0: INFO 26-04-29 07:07:13.418071 - 5:49:42 - step: 14560 acc: 0 loss: 1.8306 grad: 1.54e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6986 data: 0.0786 lr: 5.27e-05 mem: 47% pow: 595.208 W 0: INFO 26-04-29 07:07:27.740623 - 5:49:56 - step: 14570 acc: 0 loss: 1.8813 grad: 1.61e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.6205 data: 0.0667 lr: 5.27e-05 mem: 47% pow: 647.343 W 0: INFO 26-04-29 07:07:42.071007 - 5:50:10 - step: 14580 acc: 0 loss: 2.0418 grad: 1.63e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.5971 data: 0.0998 lr: 5.27e-05 mem: 47% pow: 647.83 W 0: INFO 26-04-29 07:07:56.528454 - 5:50:25 - step: 14590 acc: 0 loss: 1.8361 grad: 1.57e-01 flops: 3.91e+14 wps: 4.53e+04 iter: 0.618 data: 0.0686 lr: 5.27e-05 mem: 47% pow: 662.416 W 0: INFO 26-04-29 07:08:10.515210 - 5:50:39 - step: 14600 acc: 0 loss: 1.7954 grad: 1.64e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7828 data: 0.0256 lr: 5.27e-05 mem: 47% pow: 600.165 W 0: INFO 26-04-29 07:08:27.285338 - 5:50:55 - step: 14610 acc: 0 loss: 1.8447 grad: 1.58e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6155 data: 0.0675 lr: 5.27e-05 mem: 54% pow: 654.357 W 0: INFO 26-04-29 07:08:41.139593 - 5:51:09 - step: 14620 acc: 0 loss: 1.7744 grad: 1.57e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5807 data: 0.1033 lr: 5.26e-05 mem: 47% pow: 654.582 W 0: INFO 26-04-29 07:08:55.298389 - 5:51:23 - step: 14630 acc: 0 loss: 1.9248 grad: 1.53e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.7188 data: 0.0665 lr: 5.26e-05 mem: 47% pow: 597.471 W 0: INFO 26-04-29 07:09:08.872702 - 5:51:37 - step: 14640 acc: 0 loss: 1.7971 grad: 1.75e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6109 data: 0.0776 lr: 5.26e-05 mem: 47% pow: 657.595 W 0: INFO 26-04-29 07:09:22.815354 - 5:51:51 - step: 14650 acc: 0 loss: 1.8195 grad: 1.58e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5909 data: 0.085 lr: 5.26e-05 mem: 47% pow: 656.094 W 0: INFO 26-04-29 07:09:37.444872 - 5:52:06 - step: 14660 acc: 0 loss: 1.7515 grad: 1.51e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.5991 data: 0.0828 lr: 5.26e-05 mem: 47% pow: 652.041 W 0: INFO 26-04-29 07:09:51.881944 - 5:52:20 - step: 14670 acc: 0 loss: 1.9664 grad: 1.61e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.5988 data: 0.0902 lr: 5.26e-05 mem: 47% pow: 649.178 W 0: INFO 26-04-29 07:10:06.281396 - 5:52:34 - step: 14680 acc: 0 loss: 1.4126 grad: 1.57e-01 flops: 3.92e+14 wps: 4.56e+04 iter: 0.6149 data: 0.0834 lr: 5.26e-05 mem: 47% pow: 651.047 W 0: INFO 26-04-29 07:10:20.752942 - 5:52:49 - step: 14690 acc: 0 loss: 1.925 grad: 1.56e-01 flops: 3.91e+14 wps: 4.53e+04 iter: 0.6187 data: 0.0705 lr: 5.25e-05 mem: 47% pow: 660.799 W 0: INFO 26-04-29 07:10:34.833960 - 5:53:03 - step: 14700 acc: 0 loss: 1.4569 grad: 1.67e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.7869 data: 0.0731 lr: 5.25e-05 mem: 47% pow: 550.204 W 0: INFO 26-04-29 07:10:51.686836 - 5:53:20 - step: 14710 acc: 0 loss: 1.3459 grad: 1.58e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6181 data: 0.0708 lr: 5.25e-05 mem: 54% pow: 667.184 W 0: INFO 26-04-29 07:11:05.861673 - 5:53:34 - step: 14720 acc: 0 loss: 1.603 grad: 1.60e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.604 data: 0.0837 lr: 5.25e-05 mem: 47% pow: 659.376 W 0: INFO 26-04-29 07:11:19.886713 - 5:53:48 - step: 14730 acc: 0 loss: 1.7893 grad: 1.59e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6089 data: 0.0694 lr: 5.25e-05 mem: 47% pow: 657.816 W 0: INFO 26-04-29 07:11:34.186590 - 5:54:02 - step: 14740 acc: 0 loss: 1.8547 grad: 1.63e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6342 data: 0.0783 lr: 5.25e-05 mem: 47% pow: 639.573 W 0: INFO 26-04-29 07:11:48.276288 - 5:54:16 - step: 14750 acc: 0 loss: 1.7009 grad: 1.62e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6041 data: 0.0719 lr: 5.25e-05 mem: 47% pow: 665.484 W 0: INFO 26-04-29 07:12:02.118045 - 5:54:30 - step: 14760 acc: 0 loss: 1.7172 grad: 1.53e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6668 data: 0.0736 lr: 5.24e-05 mem: 47% pow: 631.208 W 0: INFO 26-04-29 07:12:16.340254 - 5:54:44 - step: 14770 acc: 0 loss: 1.654 grad: 1.57e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6222 data: 0.075 lr: 5.24e-05 mem: 47% pow: 638.999 W 0: INFO 26-04-29 07:12:31.271851 - 5:54:59 - step: 14780 acc: 0 loss: 1.4046 grad: 1.63e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.7555 data: 0.0715 lr: 5.24e-05 mem: 47% pow: 585.276 W 0: INFO 26-04-29 07:12:45.337793 - 5:55:13 - step: 14790 acc: 0 loss: 1.7987 grad: 1.76e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6168 data: 0.066 lr: 5.24e-05 mem: 47% pow: 645.487 W 0: INFO 26-04-29 07:12:59.713321 - 5:55:28 - step: 14800 acc: 0 loss: 1.7251 grad: 1.60e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.5966 data: 0.0769 lr: 5.24e-05 mem: 47% pow: 656.713 W 0: INFO 26-04-29 07:13:16.561412 - 5:55:45 - step: 14810 acc: 0 loss: 1.5755 grad: 1.62e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.9367 data: 0.0026 lr: 5.24e-05 mem: 54% pow: 504.602 W 0: INFO 26-04-29 07:13:31.016792 - 5:55:59 - step: 14820 acc: 0 loss: 1.7877 grad: 1.61e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6283 data: 0.0721 lr: 5.23e-05 mem: 47% pow: 643.329 W 0: INFO 26-04-29 07:13:44.999508 - 5:56:13 - step: 14830 acc: 0 loss: 1.4631 grad: 1.68e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6696 data: 0.0155 lr: 5.23e-05 mem: 47% pow: 653.791 W 0: INFO 26-04-29 07:13:59.234458 - 5:56:27 - step: 14840 acc: 0 loss: 1.7815 grad: 1.63e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6599 data: 0.0528 lr: 5.23e-05 mem: 47% pow: 638.688 W 0: INFO 26-04-29 07:14:13.506763 - 5:56:42 - step: 14850 acc: 0 loss: 1.7215 grad: 1.80e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.6347 data: 0.0753 lr: 5.23e-05 mem: 47% pow: 638.956 W 0: INFO 26-04-29 07:14:27.985773 - 5:56:56 - step: 14860 acc: 0 loss: 1.793 grad: 1.70e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.6314 data: 0.0406 lr: 5.23e-05 mem: 47% pow: 661.873 W 0: INFO 26-04-29 07:14:42.153995 - 5:57:10 - step: 14870 acc: 0 loss: 1.7708 grad: 1.62e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5992 data: 0.0716 lr: 5.23e-05 mem: 47% pow: 672.179 W 0: INFO 26-04-29 07:14:56.254632 - 5:57:24 - step: 14880 acc: 0 loss: 1.8777 grad: 1.67e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6325 data: 0.0654 lr: 5.23e-05 mem: 47% pow: 640.287 W 0: INFO 26-04-29 07:15:10.505687 - 5:57:39 - step: 14890 acc: 0 loss: 1.6352 grad: 1.57e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6217 data: 0.0661 lr: 5.22e-05 mem: 47% pow: 651.237 W 0: INFO 26-04-29 07:15:25.932677 - 5:57:54 - step: 14900 acc: 0 loss: 1.7415 grad: 1.61e-01 flops: 3.66e+14 wps: 4.25e+04 iter: 0.6452 data: 0.0674 lr: 5.22e-05 mem: 47% pow: 630.708 W 0: INFO 26-04-29 07:15:42.672040 - 5:58:11 - step: 14910 acc: 0 loss: 1.9713 grad: 1.55e-01 flops: 3.37e+14 wps: 3.92e+04 iter: 0.6307 data: 0.0818 lr: 5.22e-05 mem: 54% pow: 639.381 W 0: INFO 26-04-29 07:15:56.837492 - 5:58:25 - step: 14920 acc: 0 loss: 1.7593 grad: 1.54e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6305 data: 0.0691 lr: 5.22e-05 mem: 47% pow: 629.936 W 0: INFO 26-04-29 07:16:11.035748 - 5:58:39 - step: 14930 acc: 0 loss: 1.3948 grad: 1.57e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6545 data: 0.0596 lr: 5.22e-05 mem: 47% pow: 639.749 W 0: INFO 26-04-29 07:16:25.385486 - 5:58:53 - step: 14940 acc: 0 loss: 1.8411 grad: 1.70e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.5769 data: 0.1135 lr: 5.22e-05 mem: 47% pow: 657.268 W 0: INFO 26-04-29 07:16:39.854922 - 5:59:08 - step: 14950 acc: 0 loss: 1.6648 grad: 1.60e-01 flops: 3.91e+14 wps: 4.53e+04 iter: 0.6246 data: 0.0632 lr: 5.22e-05 mem: 47% pow: 654.72 W 0: INFO 26-04-29 07:16:53.942712 - 5:59:22 - step: 14960 acc: 0 loss: 1.8665 grad: 1.64e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6132 data: 0.0691 lr: 5.21e-05 mem: 47% pow: 651.89 W 0: INFO 26-04-29 07:17:08.225636 - 5:59:36 - step: 14970 acc: 0 loss: 1.8675 grad: 1.61e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6112 data: 0.0773 lr: 5.21e-05 mem: 47% pow: 651.415 W 0: INFO 26-04-29 07:17:22.399227 - 5:59:50 - step: 14980 acc: 0 loss: 1.8668 grad: 1.61e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6589 data: 0.064 lr: 5.21e-05 mem: 47% pow: 630.886 W 0: INFO 26-04-29 07:17:36.255762 - 6:00:04 - step: 14990 acc: 0 loss: 1.9649 grad: 1.62e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6057 data: 0.0725 lr: 5.21e-05 mem: 47% pow: 656.37 W 0: INFO 26-04-29 07:17:50.355398 - 6:00:18 - step: 15000 acc: 0 loss: 1.6626 grad: 1.52e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6269 data: 0.0691 lr: 5.21e-05 mem: 47% pow: 647.114 W 0: INFO 26-04-29 07:17:50.358495 - 6:00:18 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000015000 0: INFO 26-04-29 07:17:50.359307 - 6:00:18 - Saving... 0: INFO 26-04-29 07:17:56.664677 - 6:00:25 - State dict saved! 0: INFO 26-04-29 07:17:56.749086 - 6:00:25 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000015000/train_state_00000.json 0: INFO 26-04-29 07:17:56.753248 - 6:00:25 - Train state saved ! 0: INFO 26-04-29 07:17:56.753680 - 6:00:25 - Cleaning up checkpoints... 0: INFO 26-04-29 07:17:56.753887 - 6:00:25 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000010000'), PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000015000')] 0: INFO 26-04-29 07:17:56.754033 - 6:00:25 - Eval folders: [] 0: INFO 26-04-29 07:17:56.754161 - 6:00:25 - Other folders: [] 0: INFO 26-04-29 07:17:56.754313 - 6:00:25 - Removing folders: {PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000010000')} 0: INFO 26-04-29 07:18:00.964156 - 6:00:29 - garbage collection 0: INFO 26-04-29 07:18:15.988134 - 6:00:44 - step: 15010 acc: 0 loss: 1.7128 grad: 1.63e-01 flops: 2.21e+14 wps: 2.56e+04 iter: 0.6961 data: 0.0653 lr: 5.21e-05 mem: 54% pow: 606.652 W 0: INFO 26-04-29 07:18:30.101840 - 6:00:58 - step: 15020 acc: 0 loss: 1.9847 grad: 1.64e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6398 data: 0.0679 lr: 5.21e-05 mem: 47% pow: 639.174 W 0: INFO 26-04-29 07:18:44.621993 - 6:01:13 - step: 15030 acc: 0 loss: 1.5004 grad: 1.67e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.9042 data: 0.0735 lr: 5.20e-05 mem: 47% pow: 488.1 W 0: INFO 26-04-29 07:18:58.978060 - 6:01:27 - step: 15040 acc: 0 loss: 2.2173 grad: 1.73e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.8343 data: 0.0679 lr: 5.20e-05 mem: 47% pow: 540.316 W 0: INFO 26-04-29 07:19:13.192355 - 6:01:41 - step: 15050 acc: 0 loss: 1.6589 grad: 1.56e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.602 data: 0.0732 lr: 5.20e-05 mem: 47% pow: 660.184 W 0: INFO 26-04-29 07:19:27.399203 - 6:01:55 - step: 15060 acc: 0 loss: 1.3945 grad: 1.66e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.6106 data: 0.0714 lr: 5.20e-05 mem: 47% pow: 649.383 W 0: INFO 26-04-29 07:19:41.524157 - 6:02:10 - step: 15070 acc: 0 loss: 1.9008 grad: 1.63e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.625 data: 0.078 lr: 5.20e-05 mem: 47% pow: 644.648 W 0: INFO 26-04-29 07:19:55.758092 - 6:02:24 - step: 15080 acc: 0 loss: 1.9919 grad: 1.70e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6396 data: 0.0679 lr: 5.20e-05 mem: 47% pow: 648.495 W 0: INFO 26-04-29 07:20:10.821910 - 6:02:39 - step: 15090 acc: 0 loss: 1.6773 grad: 1.54e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.6909 data: 0.0732 lr: 5.19e-05 mem: 47% pow: 606.245 W 0: INFO 26-04-29 07:20:24.982768 - 6:02:53 - step: 15100 acc: 0 loss: 1.949 grad: 1.59e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6094 data: 0.0936 lr: 5.19e-05 mem: 47% pow: 636.345 W 0: INFO 26-04-29 07:20:42.111755 - 6:03:10 - step: 15110 acc: 0 loss: 1.7839 grad: 1.58e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.7483 data: 0.0778 lr: 5.19e-05 mem: 54% pow: 575.424 W 0: INFO 26-04-29 07:20:55.982685 - 6:03:24 - step: 15120 acc: 0 loss: 1.7679 grad: 1.51e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6296 data: 0.0708 lr: 5.19e-05 mem: 47% pow: 636.295 W 0: INFO 26-04-29 07:21:09.865199 - 6:03:38 - step: 15130 acc: 0 loss: 1.7474 grad: 1.75e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6229 data: 0.0806 lr: 5.19e-05 mem: 47% pow: 638.969 W 0: INFO 26-04-29 07:21:23.967336 - 6:03:52 - step: 15140 acc: 0 loss: 1.6251 grad: 1.56e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.5995 data: 0.0734 lr: 5.19e-05 mem: 47% pow: 670.4 W 0: INFO 26-04-29 07:21:37.725382 - 6:04:06 - step: 15150 acc: 0 loss: 1.6 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6174 data: 0.0786 lr: 5.19e-05 mem: 47% pow: 661.786 W 0: INFO 26-04-29 07:21:51.684921 - 6:04:20 - step: 15160 acc: 0 loss: 1.6273 grad: 1.55e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6157 data: 0.07 lr: 5.18e-05 mem: 47% pow: 655.63 W 0: INFO 26-04-29 07:22:05.761411 - 6:04:34 - step: 15170 acc: 0 loss: 2.0986 grad: 1.63e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6484 data: 0.056 lr: 5.18e-05 mem: 47% pow: 644.364 W 0: INFO 26-04-29 07:22:19.729784 - 6:04:48 - step: 15180 acc: 0 loss: 1.925 grad: 1.69e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6019 data: 0.0681 lr: 5.18e-05 mem: 47% pow: 667.783 W 0: INFO 26-04-29 07:22:33.334283 - 6:05:01 - step: 15190 acc: 0 loss: 2.1051 grad: 3.16e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6319 data: 0.0643 lr: 5.18e-05 mem: 47% pow: 642.505 W 0: INFO 26-04-29 07:22:47.273309 - 6:05:15 - step: 15200 acc: 0 loss: 1.5995 grad: 1.65e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6866 data: 0.0663 lr: 5.18e-05 mem: 47% pow: 617.54 W 0: INFO 26-04-29 07:23:04.095857 - 6:05:32 - step: 15210 acc: 0 loss: 1.7247 grad: 1.54e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6412 data: 0.0724 lr: 5.18e-05 mem: 54% pow: 635.698 W 0: INFO 26-04-29 07:23:18.151085 - 6:05:46 - step: 15220 acc: 0 loss: 1.7173 grad: 1.60e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.745 data: 0.0028 lr: 5.18e-05 mem: 47% pow: 617.503 W 0: INFO 26-04-29 07:23:32.523398 - 6:06:01 - step: 15230 acc: 0 loss: 1.868 grad: 1.57e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6416 data: 0.0667 lr: 5.17e-05 mem: 47% pow: 638.708 W 0: INFO 26-04-29 07:23:46.547389 - 6:06:15 - step: 15240 acc: 0 loss: 1.6389 grad: 1.59e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6425 data: 0.0703 lr: 5.17e-05 mem: 47% pow: 634.203 W 0: INFO 26-04-29 07:24:00.203181 - 6:06:28 - step: 15250 acc: 0 loss: 1.7409 grad: 1.61e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6187 data: 0.0635 lr: 5.17e-05 mem: 47% pow: 653.523 W 0: INFO 26-04-29 07:24:14.347658 - 6:06:42 - step: 15260 acc: 0 loss: 1.5402 grad: 1.72e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6077 data: 0.069 lr: 5.17e-05 mem: 47% pow: 664.824 W 0: INFO 26-04-29 07:24:28.494945 - 6:06:57 - step: 15270 acc: 0 loss: 1.6816 grad: 1.66e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6449 data: 0.0738 lr: 5.17e-05 mem: 47% pow: 627.544 W 0: INFO 26-04-29 07:24:42.489232 - 6:07:11 - step: 15280 acc: 0 loss: 1.6026 grad: 1.65e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6141 data: 0.0741 lr: 5.17e-05 mem: 47% pow: 652.348 W 0: INFO 26-04-29 07:24:56.600591 - 6:07:25 - step: 15290 acc: 0 loss: 1.8126 grad: 1.65e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5785 data: 0.3306 lr: 5.16e-05 mem: 47% pow: 533.074 W 0: INFO 26-04-29 07:25:10.371721 - 6:07:38 - step: 15300 acc: 0 loss: 1.7996 grad: 1.70e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6359 data: 0.078 lr: 5.16e-05 mem: 47% pow: 633.349 W 0: INFO 26-04-29 07:25:27.246634 - 6:07:55 - step: 15310 acc: 0 loss: 1.8623 grad: 1.52e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6355 data: 0.0677 lr: 5.16e-05 mem: 54% pow: 639.158 W 0: INFO 26-04-29 07:25:41.299924 - 6:08:09 - step: 15320 acc: 0 loss: 1.4274 grad: 1.61e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6279 data: 0.059 lr: 5.16e-05 mem: 47% pow: 658.926 W 0: INFO 26-04-29 07:25:54.992179 - 6:08:23 - step: 15330 acc: 0 loss: 1.7855 grad: 1.53e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6165 data: 0.078 lr: 5.16e-05 mem: 47% pow: 644.235 W 0: INFO 26-04-29 07:26:09.032464 - 6:08:37 - step: 15340 acc: 0 loss: 1.4921 grad: 1.80e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6407 data: 0.047 lr: 5.16e-05 mem: 47% pow: 655.981 W 0: INFO 26-04-29 07:26:23.006371 - 6:08:51 - step: 15350 acc: 0 loss: 1.6535 grad: 1.66e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6501 data: 0.0538 lr: 5.16e-05 mem: 47% pow: 642.097 W 0: INFO 26-04-29 07:26:36.980040 - 6:09:05 - step: 15360 acc: 0 loss: 1.8554 grad: 1.60e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6337 data: 0.0635 lr: 5.15e-05 mem: 47% pow: 643.69 W 0: INFO 26-04-29 07:26:51.496417 - 6:09:20 - step: 15370 acc: 0 loss: 2.0562 grad: 1.64e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.6344 data: 0.0625 lr: 5.15e-05 mem: 47% pow: 651.054 W 0: INFO 26-04-29 07:27:05.525316 - 6:09:34 - step: 15380 acc: 0 loss: 1.6438 grad: 1.88e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6524 data: 0.0718 lr: 5.15e-05 mem: 47% pow: 632.77 W 0: INFO 26-04-29 07:27:19.681983 - 6:09:48 - step: 15390 acc: 0 loss: 1.7025 grad: 1.60e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6551 data: 0.0436 lr: 5.15e-05 mem: 47% pow: 645.762 W 0: INFO 26-04-29 07:27:34.058624 - 6:10:02 - step: 15400 acc: 0 loss: 1.8057 grad: 1.70e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6436 data: 0.056 lr: 5.15e-05 mem: 47% pow: 640.454 W 0: INFO 26-04-29 07:27:50.589802 - 6:10:19 - step: 15410 acc: 0 loss: 1.87 grad: 1.57e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6073 data: 0.066 lr: 5.15e-05 mem: 54% pow: 661.631 W 0: INFO 26-04-29 07:28:04.399910 - 6:10:32 - step: 15420 acc: 0 loss: 1.592 grad: 1.59e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6257 data: 0.0798 lr: 5.15e-05 mem: 47% pow: 635.983 W 0: INFO 26-04-29 07:28:18.608617 - 6:10:47 - step: 15430 acc: 0 loss: 1.5595 grad: 1.53e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6347 data: 0.0638 lr: 5.14e-05 mem: 47% pow: 637.775 W 0: INFO 26-04-29 07:28:32.512409 - 6:11:01 - step: 15440 acc: 0 loss: 1.917 grad: 1.55e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6403 data: 0.0654 lr: 5.14e-05 mem: 47% pow: 644.85 W 0: INFO 26-04-29 07:28:47.135012 - 6:11:15 - step: 15450 acc: 0 loss: 1.5189 grad: 1.60e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6272 data: 0.0746 lr: 5.14e-05 mem: 47% pow: 640.47 W 0: INFO 26-04-29 07:29:00.745937 - 6:11:29 - step: 15460 acc: 0 loss: 1.6713 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6242 data: 0.0659 lr: 5.14e-05 mem: 47% pow: 648.97 W 0: INFO 26-04-29 07:29:14.639502 - 6:11:43 - step: 15470 acc: 0 loss: 1.8028 grad: 1.63e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.62 data: 0.0737 lr: 5.14e-05 mem: 47% pow: 660.975 W 0: INFO 26-04-29 07:29:28.761840 - 6:11:57 - step: 15480 acc: 0 loss: 1.6023 grad: 1.55e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.666 data: 0.0706 lr: 5.14e-05 mem: 47% pow: 621.045 W 0: INFO 26-04-29 07:29:42.677294 - 6:12:11 - step: 15490 acc: 0 loss: 1.6784 grad: 1.58e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6249 data: 0.0569 lr: 5.14e-05 mem: 47% pow: 652.243 W 0: INFO 26-04-29 07:29:56.849650 - 6:12:25 - step: 15500 acc: 0 loss: 1.6646 grad: 1.66e-01 flops: 3.98e+14 wps: 4.63e+04 iter: 0.5944 data: 0.0816 lr: 5.13e-05 mem: 47% pow: 661.166 W 0: INFO 26-04-29 07:30:13.721663 - 6:12:42 - step: 15510 acc: 0 loss: 1.8445 grad: 1.74e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.599 data: 0.0968 lr: 5.13e-05 mem: 54% pow: 654.008 W 0: INFO 26-04-29 07:30:27.866482 - 6:12:56 - step: 15520 acc: 0 loss: 1.5732 grad: 1.61e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6175 data: 0.0713 lr: 5.13e-05 mem: 47% pow: 652.685 W 0: INFO 26-04-29 07:30:41.724779 - 6:13:10 - step: 15530 acc: 0 loss: 1.7862 grad: 1.54e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6191 data: 0.0708 lr: 5.13e-05 mem: 47% pow: 655.442 W 0: INFO 26-04-29 07:30:55.602815 - 6:13:24 - step: 15540 acc: 0 loss: 1.8246 grad: 1.60e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6826 data: 0.0359 lr: 5.13e-05 mem: 47% pow: 633.951 W 0: INFO 26-04-29 07:31:09.311830 - 6:13:37 - step: 15550 acc: 0 loss: 1.6521 grad: 1.59e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6389 data: 0.0769 lr: 5.13e-05 mem: 47% pow: 636.696 W 0: INFO 26-04-29 07:31:23.294284 - 6:13:51 - step: 15560 acc: 0 loss: 1.6794 grad: 1.65e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6096 data: 0.1205 lr: 5.12e-05 mem: 47% pow: 626.69 W 0: INFO 26-04-29 07:31:37.501559 - 6:14:06 - step: 15570 acc: 0 loss: 1.5066 grad: 1.51e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.6687 data: 0.0706 lr: 5.12e-05 mem: 47% pow: 614.146 W 0: INFO 26-04-29 07:31:51.353754 - 6:14:19 - step: 15580 acc: 0 loss: 1.6462 grad: 1.62e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6389 data: 0.0605 lr: 5.12e-05 mem: 47% pow: 644.889 W 0: INFO 26-04-29 07:32:05.222695 - 6:14:33 - step: 15590 acc: 0 loss: 1.6705 grad: 1.73e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6072 data: 0.0747 lr: 5.12e-05 mem: 47% pow: 653.703 W 0: INFO 26-04-29 07:32:19.042689 - 6:14:47 - step: 15600 acc: 0 loss: 1.5907 grad: 1.62e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6864 data: 0.0121 lr: 5.12e-05 mem: 47% pow: 651.73 W 0: INFO 26-04-29 07:32:35.989943 - 6:15:04 - step: 15610 acc: 0 loss: 1.5937 grad: 1.70e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.7778 data: 0.0672 lr: 5.12e-05 mem: 54% pow: 563.677 W 0: INFO 26-04-29 07:32:50.571268 - 6:15:19 - step: 15620 acc: 0 loss: 2.0002 grad: 1.57e-01 flops: 3.87e+14 wps: 4.50e+04 iter: 0.6642 data: 0.0697 lr: 5.12e-05 mem: 47% pow: 624.946 W 0: INFO 26-04-29 07:33:04.700629 - 6:15:33 - step: 15630 acc: 0 loss: 1.627 grad: 1.85e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.8441 data: 0.0723 lr: 5.11e-05 mem: 47% pow: 522.451 W 0: INFO 26-04-29 07:33:18.380257 - 6:15:46 - step: 15640 acc: 0 loss: 1.6963 grad: 1.63e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.668 data: 0.0368 lr: 5.11e-05 mem: 47% pow: 647.018 W 0: INFO 26-04-29 07:33:32.213950 - 6:16:00 - step: 15650 acc: 0 loss: 1.744 grad: 1.66e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6387 data: 0.0769 lr: 5.11e-05 mem: 47% pow: 635.628 W 0: INFO 26-04-29 07:33:46.127002 - 6:16:14 - step: 15660 acc: 0 loss: 1.4374 grad: 1.84e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6192 data: 0.0697 lr: 5.11e-05 mem: 47% pow: 654.201 W 0: INFO 26-04-29 07:34:00.269441 - 6:16:28 - step: 15670 acc: 0 loss: 1.582 grad: 1.60e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6938 data: 0.0414 lr: 5.11e-05 mem: 47% pow: 619.97 W 0: INFO 26-04-29 07:34:14.153341 - 6:16:42 - step: 15680 acc: 0 loss: 1.7667 grad: 1.55e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.649 data: 0.0687 lr: 5.11e-05 mem: 47% pow: 630.071 W 0: INFO 26-04-29 07:34:27.918771 - 6:16:56 - step: 15690 acc: 0 loss: 1.9265 grad: 1.56e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6371 data: 0.0655 lr: 5.11e-05 mem: 47% pow: 639.501 W 0: INFO 26-04-29 07:34:41.970498 - 6:17:10 - step: 15700 acc: 0 loss: 1.6996 grad: 1.55e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.604 data: 0.0787 lr: 5.10e-05 mem: 47% pow: 649.729 W 0: INFO 26-04-29 07:34:58.955016 - 6:17:27 - step: 15710 acc: 0 loss: 1.867 grad: 1.61e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 0.734 data: 0.006 lr: 5.10e-05 mem: 54% pow: 616.605 W 0: INFO 26-04-29 07:35:12.847827 - 6:17:41 - step: 15720 acc: 0 loss: 1.7096 grad: 1.58e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6111 data: 0.0978 lr: 5.10e-05 mem: 47% pow: 647.07 W 0: INFO 26-04-29 07:35:26.839237 - 6:17:55 - step: 15730 acc: 0 loss: 1.8659 grad: 1.75e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6446 data: 0.0607 lr: 5.10e-05 mem: 47% pow: 639.758 W 0: INFO 26-04-29 07:35:40.753250 - 6:18:09 - step: 15740 acc: 0 loss: 1.7297 grad: 1.51e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.613 data: 0.0814 lr: 5.10e-05 mem: 47% pow: 652.111 W 0: INFO 26-04-29 07:35:54.537958 - 6:18:23 - step: 15750 acc: 0 loss: 1.6667 grad: 1.77e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6097 data: 0.0706 lr: 5.10e-05 mem: 47% pow: 648.603 W 0: INFO 26-04-29 07:36:08.445799 - 6:18:37 - step: 15760 acc: 0 loss: 1.7745 grad: 1.60e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.593 data: 0.0955 lr: 5.10e-05 mem: 47% pow: 656.726 W 0: INFO 26-04-29 07:36:22.291296 - 6:18:50 - step: 15770 acc: 0 loss: 1.9179 grad: 1.74e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.632 data: 0.0565 lr: 5.09e-05 mem: 47% pow: 654.811 W 0: INFO 26-04-29 07:36:36.491729 - 6:19:05 - step: 15780 acc: 0 loss: 2.0298 grad: 1.59e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6057 data: 0.0728 lr: 5.09e-05 mem: 47% pow: 653.14 W 0: INFO 26-04-29 07:36:50.832642 - 6:19:19 - step: 15790 acc: 0 loss: 1.966 grad: 1.64e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.5892 data: 0.0996 lr: 5.09e-05 mem: 47% pow: 653.357 W 0: INFO 26-04-29 07:37:04.934505 - 6:19:33 - step: 15800 acc: 0 loss: 1.8522 grad: 1.62e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6411 data: 0.0799 lr: 5.09e-05 mem: 47% pow: 621.414 W 0: INFO 26-04-29 07:37:21.851301 - 6:19:50 - step: 15810 acc: 0 loss: 1.5864 grad: 1.56e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6061 data: 0.0659 lr: 5.09e-05 mem: 54% pow: 660.048 W 0: INFO 26-04-29 07:37:35.757034 - 6:20:04 - step: 15820 acc: 0 loss: 1.4824 grad: 1.53e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6425 data: 0.0614 lr: 5.09e-05 mem: 47% pow: 636.277 W 0: INFO 26-04-29 07:37:49.685900 - 6:20:18 - step: 15830 acc: 0 loss: 1.6873 grad: 1.65e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6461 data: 0.0554 lr: 5.08e-05 mem: 47% pow: 646.645 W 0: INFO 26-04-29 07:38:04.233284 - 6:20:32 - step: 15840 acc: 0 loss: 2.02 grad: 1.56e-01 flops: 3.88e+14 wps: 4.51e+04 iter: 0.6242 data: 0.0735 lr: 5.08e-05 mem: 47% pow: 645.18 W 0: INFO 26-04-29 07:38:18.385324 - 6:20:46 - step: 15850 acc: 0 loss: 1.7167 grad: 1.56e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6396 data: 0.0511 lr: 5.08e-05 mem: 47% pow: 650.892 W 0: INFO 26-04-29 07:38:32.083129 - 6:21:00 - step: 15860 acc: 0 loss: 1.4277 grad: 1.52e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.645 data: 0.0612 lr: 5.08e-05 mem: 47% pow: 644.936 W 0: INFO 26-04-29 07:38:45.844772 - 6:21:14 - step: 15870 acc: 0 loss: 1.7279 grad: 1.58e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6365 data: 0.0747 lr: 5.08e-05 mem: 47% pow: 635.443 W 0: INFO 26-04-29 07:39:00.119003 - 6:21:28 - step: 15880 acc: 0 loss: 1.8363 grad: 1.64e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.62 data: 0.0856 lr: 5.08e-05 mem: 47% pow: 651.627 W 0: INFO 26-04-29 07:39:15.702029 - 6:21:44 - step: 15890 acc: 0 loss: 2.0334 grad: 1.47e-01 flops: 3.62e+14 wps: 4.21e+04 iter: 0.6238 data: 0.0864 lr: 5.08e-05 mem: 47% pow: 643.851 W 0: INFO 26-04-29 07:39:29.753882 - 6:21:58 - step: 15900 acc: 0 loss: 1.7271 grad: 1.55e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6549 data: 0.0372 lr: 5.07e-05 mem: 47% pow: 643.67 W 0: INFO 26-04-29 07:39:46.866338 - 6:22:15 - step: 15910 acc: 0 loss: 2.0606 grad: 1.57e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.5874 data: 0.0857 lr: 5.07e-05 mem: 54% pow: 656.39 W 0: INFO 26-04-29 07:40:00.640937 - 6:22:29 - step: 15920 acc: 0 loss: 1.5101 grad: 1.73e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6614 data: 0.0707 lr: 5.07e-05 mem: 47% pow: 627.758 W 0: INFO 26-04-29 07:40:14.409213 - 6:22:42 - step: 15930 acc: 0 loss: 2.094 grad: 1.59e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6038 data: 0.0789 lr: 5.07e-05 mem: 47% pow: 655.52 W 0: INFO 26-04-29 07:40:28.060315 - 6:22:56 - step: 15940 acc: 0 loss: 1.8176 grad: 1.75e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6252 data: 0.0755 lr: 5.07e-05 mem: 47% pow: 640.293 W 0: INFO 26-04-29 07:40:42.016580 - 6:23:10 - step: 15950 acc: 0 loss: 1.8906 grad: 1.55e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6356 data: 0.0648 lr: 5.07e-05 mem: 47% pow: 648.207 W 0: INFO 26-04-29 07:40:55.669666 - 6:23:24 - step: 15960 acc: 0 loss: 1.7772 grad: 1.56e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6469 data: 0.0857 lr: 5.07e-05 mem: 47% pow: 632.956 W 0: INFO 26-04-29 07:41:10.002781 - 6:23:38 - step: 15970 acc: 0 loss: 1.8913 grad: 1.54e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6468 data: 0.054 lr: 5.06e-05 mem: 47% pow: 660.06 W 0: INFO 26-04-29 07:41:24.001482 - 6:23:52 - step: 15980 acc: 0 loss: 1.6972 grad: 1.55e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6261 data: 0.0629 lr: 5.06e-05 mem: 47% pow: 655.351 W 0: INFO 26-04-29 07:41:37.881936 - 6:24:06 - step: 15990 acc: 0 loss: 1.633 grad: 1.66e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6576 data: 0.0621 lr: 5.06e-05 mem: 47% pow: 630.493 W 0: INFO 26-04-29 07:41:51.662480 - 6:24:20 - step: 16000 acc: 0 loss: 1.6423 grad: 1.54e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6406 data: 0.0671 lr: 5.06e-05 mem: 47% pow: 642.965 W 0: INFO 26-04-29 07:41:55.319291 - 6:24:23 - garbage collection 0: INFO 26-04-29 07:42:10.055823 - 6:24:38 - step: 16010 acc: 0 loss: 1.2583 grad: 1.56e-01 flops: 3.07e+14 wps: 3.56e+04 iter: 0.6254 data: 0.0759 lr: 5.06e-05 mem: 54% pow: 634.923 W 0: INFO 26-04-29 07:42:24.124201 - 6:24:52 - step: 16020 acc: 0 loss: 1.4498 grad: 1.62e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6738 data: 0.0712 lr: 5.06e-05 mem: 47% pow: 622.053 W 0: INFO 26-04-29 07:42:38.355034 - 6:25:06 - step: 16030 acc: 0 loss: 1.5728 grad: 1.77e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6176 data: 0.075 lr: 5.05e-05 mem: 47% pow: 646.73 W 0: INFO 26-04-29 07:42:52.503053 - 6:25:21 - step: 16040 acc: 0 loss: 1.4045 grad: 1.46e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.67 data: 0.07 lr: 5.05e-05 mem: 47% pow: 613.703 W 0: INFO 26-04-29 07:43:06.485360 - 6:25:35 - step: 16050 acc: 0 loss: 1.6817 grad: 1.60e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6124 data: 0.0698 lr: 5.05e-05 mem: 47% pow: 659.163 W 0: INFO 26-04-29 07:43:20.758533 - 6:25:49 - step: 16060 acc: 0 loss: 1.8333 grad: 1.53e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.7404 data: 0.0849 lr: 5.05e-05 mem: 47% pow: 575.236 W 0: INFO 26-04-29 07:43:34.630537 - 6:26:03 - step: 16070 acc: 0 loss: 1.7233 grad: 1.63e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6493 data: 0.0661 lr: 5.05e-05 mem: 47% pow: 626.706 W 0: INFO 26-04-29 07:43:48.629758 - 6:26:17 - step: 16080 acc: 0 loss: 1.4844 grad: 1.54e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6073 data: 0.0697 lr: 5.05e-05 mem: 47% pow: 654.802 W 0: INFO 26-04-29 07:44:02.464483 - 6:26:31 - step: 16090 acc: 0 loss: 1.5945 grad: 1.54e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6301 data: 0.0616 lr: 5.05e-05 mem: 47% pow: 657.145 W 0: INFO 26-04-29 07:44:16.289284 - 6:26:44 - step: 16100 acc: 0 loss: 1.4813 grad: 1.49e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.609 data: 0.0782 lr: 5.04e-05 mem: 47% pow: 652.053 W 0: INFO 26-04-29 07:44:33.046565 - 6:27:01 - step: 16110 acc: 0 loss: 1.5054 grad: 1.56e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6343 data: 0.0668 lr: 5.04e-05 mem: 54% pow: 649.19 W 0: INFO 26-04-29 07:44:46.861218 - 6:27:15 - step: 16120 acc: 0 loss: 1.7822 grad: 1.52e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6129 data: 0.0751 lr: 5.04e-05 mem: 47% pow: 654.159 W 0: INFO 26-04-29 07:45:00.857349 - 6:27:29 - step: 16130 acc: 0 loss: 1.718 grad: 1.61e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6171 data: 0.0873 lr: 5.04e-05 mem: 47% pow: 645.299 W 0: INFO 26-04-29 07:45:14.904739 - 6:27:43 - step: 16140 acc: 0 loss: 1.8891 grad: 1.52e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6288 data: 0.0735 lr: 5.04e-05 mem: 47% pow: 641.373 W 0: INFO 26-04-29 07:45:28.946591 - 6:27:57 - step: 16150 acc: 0 loss: 1.5846 grad: 1.55e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6396 data: 0.0564 lr: 5.04e-05 mem: 47% pow: 655.526 W 0: INFO 26-04-29 07:45:42.937316 - 6:28:11 - step: 16160 acc: 0 loss: 1.4834 grad: 1.54e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6439 data: 0.0611 lr: 5.04e-05 mem: 47% pow: 640.891 W 0: INFO 26-04-29 07:45:57.048163 - 6:28:25 - step: 16170 acc: 0 loss: 1.799 grad: 1.73e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6878 data: 0.0666 lr: 5.03e-05 mem: 47% pow: 621.929 W 0: INFO 26-04-29 07:46:10.983897 - 6:28:39 - step: 16180 acc: 0 loss: 1.4135 grad: 1.74e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.6129 data: 0.0714 lr: 5.03e-05 mem: 47% pow: 656.64 W 0: INFO 26-04-29 07:46:24.819223 - 6:28:53 - step: 16190 acc: 0 loss: 1.9494 grad: 1.70e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6207 data: 0.0766 lr: 5.03e-05 mem: 47% pow: 642.278 W 0: INFO 26-04-29 07:46:39.057096 - 6:29:07 - step: 16200 acc: 0 loss: 1.6373 grad: 1.50e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.63 data: 0.0554 lr: 5.03e-05 mem: 47% pow: 662.312 W 0: INFO 26-04-29 07:46:56.444225 - 6:29:25 - step: 16210 acc: 0 loss: 1.5083 grad: 1.63e-01 flops: 3.25e+14 wps: 3.77e+04 iter: 0.6085 data: 0.0759 lr: 5.03e-05 mem: 54% pow: 651.06 W 0: INFO 26-04-29 07:47:10.687787 - 6:29:39 - step: 16220 acc: 0 loss: 1.6136 grad: 1.58e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.6742 data: 0.061 lr: 5.03e-05 mem: 47% pow: 627.758 W 0: INFO 26-04-29 07:47:24.597669 - 6:29:53 - step: 16230 acc: 0 loss: 1.8047 grad: 1.61e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6036 data: 0.0839 lr: 5.03e-05 mem: 47% pow: 657.683 W 0: INFO 26-04-29 07:47:45.217177 - 6:30:13 - step: 16240 acc: 0 loss: 1.9384 grad: 1.54e-01 flops: 2.74e+14 wps: 3.18e+04 iter: 0.8662 data: 0.0783 lr: 5.02e-05 mem: 47% pow: 506.078 W 0: INFO 26-04-29 07:47:59.460419 - 6:30:28 - step: 16250 acc: 0 loss: 1.7358 grad: 1.57e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.6197 data: 0.0784 lr: 5.02e-05 mem: 47% pow: 634.973 W 0: INFO 26-04-29 07:48:13.559179 - 6:30:42 - step: 16260 acc: 0 loss: 1.5131 grad: 1.63e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6481 data: 0.0371 lr: 5.02e-05 mem: 47% pow: 657.876 W 0: INFO 26-04-29 07:48:27.608967 - 6:30:56 - step: 16270 acc: 0 loss: 1.9229 grad: 1.58e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6135 data: 0.0733 lr: 5.02e-05 mem: 47% pow: 657.757 W 0: INFO 26-04-29 07:48:41.836211 - 6:31:10 - step: 16280 acc: 0 loss: 1.7769 grad: 1.50e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.8197 data: 0.0791 lr: 5.02e-05 mem: 47% pow: 537.299 W 0: INFO 26-04-29 07:48:55.877339 - 6:31:24 - step: 16290 acc: 0 loss: 1.8108 grad: 1.64e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6309 data: 0.0649 lr: 5.02e-05 mem: 47% pow: 644.823 W 0: INFO 26-04-29 07:49:10.033225 - 6:31:38 - step: 16300 acc: 0 loss: 1.5511 grad: 1.51e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6306 data: 0.0681 lr: 5.01e-05 mem: 47% pow: 638.331 W 0: INFO 26-04-29 07:49:26.878518 - 6:31:55 - step: 16310 acc: 0 loss: 1.6444 grad: 1.61e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.616 data: 0.0633 lr: 5.01e-05 mem: 54% pow: 652.211 W 0: INFO 26-04-29 07:49:40.948921 - 6:32:09 - step: 16320 acc: 0 loss: 1.8015 grad: 2.30e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6202 data: 0.0611 lr: 5.01e-05 mem: 47% pow: 665.535 W 0: INFO 26-04-29 07:49:54.876091 - 6:32:23 - step: 16330 acc: 0 loss: 1.8168 grad: 1.50e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7239 data: 0.0525 lr: 5.01e-05 mem: 47% pow: 598.639 W 0: INFO 26-04-29 07:50:08.994937 - 6:32:37 - step: 16340 acc: 0 loss: 1.8658 grad: 1.50e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6011 data: 0.0763 lr: 5.01e-05 mem: 47% pow: 655.939 W 0: INFO 26-04-29 07:50:23.131537 - 6:32:51 - step: 16350 acc: 0 loss: 1.4285 grad: 1.56e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6346 data: 0.0586 lr: 5.01e-05 mem: 47% pow: 648.997 W 0: INFO 26-04-29 07:50:37.157094 - 6:33:05 - step: 16360 acc: 0 loss: 1.6476 grad: 1.64e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6837 data: 0.0671 lr: 5.01e-05 mem: 47% pow: 618.708 W 0: INFO 26-04-29 07:50:51.305465 - 6:33:19 - step: 16370 acc: 0 loss: 1.7655 grad: 1.69e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6237 data: 0.0998 lr: 5.00e-05 mem: 47% pow: 646.39 W 0: INFO 26-04-29 07:51:05.313589 - 6:33:33 - step: 16380 acc: 0 loss: 1.7218 grad: 1.70e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6514 data: 0.0649 lr: 5.00e-05 mem: 47% pow: 637.361 W 0: INFO 26-04-29 07:51:19.408666 - 6:33:47 - step: 16390 acc: 0 loss: 1.5554 grad: 1.55e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6501 data: 0.067 lr: 5.00e-05 mem: 47% pow: 629.147 W 0: INFO 26-04-29 07:51:33.094621 - 6:34:01 - step: 16400 acc: 0 loss: 1.5746 grad: 1.70e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6298 data: 0.0678 lr: 5.00e-05 mem: 47% pow: 640.697 W 0: INFO 26-04-29 07:51:49.927267 - 6:34:18 - step: 16410 acc: 0 loss: 1.834 grad: 1.67e-01 flops: 3.36e+14 wps: 3.89e+04 iter: 0.6147 data: 0.0806 lr: 5.00e-05 mem: 54% pow: 645.407 W 0: INFO 26-04-29 07:52:03.874404 - 6:34:32 - step: 16420 acc: 0 loss: 1.6043 grad: 1.59e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6334 data: 0.0615 lr: 5.00e-05 mem: 47% pow: 650.386 W 0: INFO 26-04-29 07:52:17.729653 - 6:34:46 - step: 16430 acc: 0 loss: 1.5451 grad: 1.57e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6176 data: 0.0736 lr: 5.00e-05 mem: 47% pow: 659.257 W 0: INFO 26-04-29 07:52:31.922143 - 6:35:00 - step: 16440 acc: 0 loss: 1.7371 grad: 1.67e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6559 data: 0.0742 lr: 4.99e-05 mem: 47% pow: 628.402 W 0: INFO 26-04-29 07:52:45.848344 - 6:35:14 - step: 16450 acc: 0 loss: 1.7455 grad: 1.54e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6196 data: 0.0727 lr: 4.99e-05 mem: 47% pow: 643.712 W 0: INFO 26-04-29 07:52:59.758093 - 6:35:28 - step: 16460 acc: 0 loss: 1.4423 grad: 1.54e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6116 data: 0.0702 lr: 4.99e-05 mem: 47% pow: 649.576 W 0: INFO 26-04-29 07:53:13.842718 - 6:35:42 - step: 16470 acc: 0 loss: 1.75 grad: 1.64e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6314 data: 0.0752 lr: 4.99e-05 mem: 47% pow: 644.225 W 0: INFO 26-04-29 07:53:28.035798 - 6:35:56 - step: 16480 acc: 0 loss: 1.636 grad: 1.62e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.596 data: 0.1023 lr: 4.99e-05 mem: 47% pow: 631.374 W 0: INFO 26-04-29 07:53:41.689183 - 6:36:10 - step: 16490 acc: 0 loss: 1.8076 grad: 1.87e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6176 data: 0.0769 lr: 4.99e-05 mem: 47% pow: 667.798 W 0: INFO 26-04-29 07:53:55.639648 - 6:36:24 - step: 16500 acc: 0 loss: 2.0428 grad: 1.61e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6856 data: 0.0028 lr: 4.98e-05 mem: 47% pow: 650.989 W 0: INFO 26-04-29 07:54:12.379208 - 6:36:40 - step: 16510 acc: 0 loss: 1.5829 grad: 1.51e-01 flops: 3.37e+14 wps: 3.92e+04 iter: 0.6024 data: 0.0842 lr: 4.98e-05 mem: 54% pow: 650.073 W 0: INFO 26-04-29 07:54:26.560691 - 6:36:55 - step: 16520 acc: 0 loss: 1.6347 grad: 1.72e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6475 data: 0.0623 lr: 4.98e-05 mem: 47% pow: 639.916 W 0: INFO 26-04-29 07:54:40.340497 - 6:37:08 - step: 16530 acc: 0 loss: 1.5476 grad: 1.56e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6208 data: 0.0668 lr: 4.98e-05 mem: 47% pow: 653.961 W 0: INFO 26-04-29 07:54:54.358682 - 6:37:22 - step: 16540 acc: 0 loss: 2.0488 grad: 1.53e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6633 data: 0.0693 lr: 4.98e-05 mem: 47% pow: 628.501 W 0: INFO 26-04-29 07:55:08.172343 - 6:37:36 - step: 16550 acc: 0 loss: 1.4454 grad: 1.58e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6147 data: 0.0749 lr: 4.98e-05 mem: 47% pow: 656.054 W 0: INFO 26-04-29 07:55:22.082408 - 6:37:50 - step: 16560 acc: 0 loss: 1.5008 grad: 1.57e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6149 data: 0.0707 lr: 4.98e-05 mem: 47% pow: 656.847 W 0: INFO 26-04-29 07:55:35.749798 - 6:38:04 - step: 16570 acc: 0 loss: 1.802 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6309 data: 0.0671 lr: 4.97e-05 mem: 47% pow: 638.932 W 0: INFO 26-04-29 07:55:49.486060 - 6:38:18 - step: 16580 acc: 0 loss: 1.4906 grad: 1.62e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6233 data: 0.0607 lr: 4.97e-05 mem: 47% pow: 650.66 W 0: INFO 26-04-29 07:56:03.535393 - 6:38:32 - step: 16590 acc: 0 loss: 2.5157 grad: 1.51e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6097 data: 0.0734 lr: 4.97e-05 mem: 47% pow: 653.902 W 0: INFO 26-04-29 07:56:17.600460 - 6:38:46 - step: 16600 acc: 0 loss: 1.7842 grad: 1.51e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6047 data: 0.0835 lr: 4.97e-05 mem: 47% pow: 657.709 W 0: INFO 26-04-29 07:56:34.364630 - 6:39:02 - step: 16610 acc: 0 loss: 1.7846 grad: 1.57e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6308 data: 0.0749 lr: 4.97e-05 mem: 54% pow: 645.429 W 0: INFO 26-04-29 07:56:48.457549 - 6:39:17 - step: 16620 acc: 0 loss: 1.9117 grad: 1.77e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6148 data: 0.0671 lr: 4.97e-05 mem: 47% pow: 663.513 W 0: INFO 26-04-29 07:57:02.036514 - 6:39:30 - step: 16630 acc: 0 loss: 1.4891 grad: 1.64e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5993 data: 0.0796 lr: 4.97e-05 mem: 47% pow: 656.2 W 0: INFO 26-04-29 07:57:15.993333 - 6:39:44 - step: 16640 acc: 0 loss: 1.683 grad: 1.53e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6943 data: 0.0029 lr: 4.96e-05 mem: 47% pow: 639.045 W 0: INFO 26-04-29 07:57:30.149014 - 6:39:58 - step: 16650 acc: 0 loss: 1.3794 grad: 1.59e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6415 data: 0.0731 lr: 4.96e-05 mem: 47% pow: 633.525 W 0: INFO 26-04-29 07:57:44.401376 - 6:40:12 - step: 16660 acc: 0 loss: 1.6516 grad: 1.64e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6241 data: 0.0656 lr: 4.96e-05 mem: 47% pow: 652.256 W 0: INFO 26-04-29 07:57:58.019509 - 6:40:26 - step: 16670 acc: 0 loss: 1.4852 grad: 1.49e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6119 data: 0.0732 lr: 4.96e-05 mem: 47% pow: 660.139 W 0: INFO 26-04-29 07:58:12.220890 - 6:40:40 - step: 16680 acc: 0 loss: 1.7554 grad: 1.53e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6323 data: 0.0641 lr: 4.96e-05 mem: 47% pow: 657.995 W 0: INFO 26-04-29 07:58:26.208556 - 6:40:54 - step: 16690 acc: 0 loss: 1.7797 grad: 1.57e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6074 data: 0.0713 lr: 4.96e-05 mem: 47% pow: 648.207 W 0: INFO 26-04-29 07:58:40.032549 - 6:41:08 - step: 16700 acc: 0 loss: 1.6729 grad: 1.73e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6286 data: 0.062 lr: 4.96e-05 mem: 47% pow: 650.782 W 0: INFO 26-04-29 07:58:57.020802 - 6:41:25 - step: 16710 acc: 0 loss: 1.7068 grad: 1.52e-01 flops: 3.32e+14 wps: 3.86e+04 iter: 0.6175 data: 0.0718 lr: 4.95e-05 mem: 54% pow: 645.492 W 0: INFO 26-04-29 07:59:10.999557 - 6:41:39 - step: 16720 acc: 0 loss: 1.4067 grad: 1.70e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.597 data: 0.0824 lr: 4.95e-05 mem: 47% pow: 656.479 W 0: INFO 26-04-29 07:59:25.146162 - 6:41:53 - step: 16730 acc: 0 loss: 1.3468 grad: 1.55e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6542 data: 0.0724 lr: 4.95e-05 mem: 47% pow: 630.266 W 0: INFO 26-04-29 07:59:38.807143 - 6:42:07 - step: 16740 acc: 0 loss: 1.8053 grad: 1.51e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6408 data: 0.0686 lr: 4.95e-05 mem: 47% pow: 639.046 W 0: INFO 26-04-29 07:59:52.470203 - 6:42:21 - step: 16750 acc: 0 loss: 1.6191 grad: 1.57e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6132 data: 0.0764 lr: 4.95e-05 mem: 47% pow: 651.705 W 0: INFO 26-04-29 08:00:06.721626 - 6:42:35 - step: 16760 acc: 0 loss: 1.2367 grad: 1.60e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.5959 data: 0.0896 lr: 4.95e-05 mem: 47% pow: 652.494 W 0: INFO 26-04-29 08:00:20.449877 - 6:42:49 - step: 16770 acc: 0 loss: 1.6027 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6696 data: 0.0699 lr: 4.94e-05 mem: 47% pow: 621.797 W 0: INFO 26-04-29 08:00:34.198899 - 6:43:02 - step: 16780 acc: 0 loss: 1.6298 grad: 2.41e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6208 data: 0.0663 lr: 4.94e-05 mem: 47% pow: 651.309 W 0: INFO 26-04-29 08:00:48.656355 - 6:43:17 - step: 16790 acc: 0 loss: 1.7856 grad: 1.64e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6083 data: 0.072 lr: 4.94e-05 mem: 47% pow: 653.164 W 0: INFO 26-04-29 08:01:02.626832 - 6:43:31 - step: 16800 acc: 0 loss: 1.1818 grad: 1.65e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6454 data: 0.051 lr: 4.94e-05 mem: 47% pow: 649.773 W 0: INFO 26-04-29 08:01:19.806017 - 6:43:48 - step: 16810 acc: 0 loss: 1.5643 grad: 1.55e-01 flops: 3.29e+14 wps: 3.82e+04 iter: 0.6495 data: 0.0765 lr: 4.94e-05 mem: 54% pow: 638.604 W 0: INFO 26-04-29 08:01:33.871950 - 6:44:02 - step: 16820 acc: 0 loss: 1.7008 grad: 1.49e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6344 data: 0.0761 lr: 4.94e-05 mem: 47% pow: 654.534 W 0: INFO 26-04-29 08:01:47.582700 - 6:44:16 - step: 16830 acc: 0 loss: 1.571 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6507 data: 0.0595 lr: 4.94e-05 mem: 47% pow: 636.944 W 0: INFO 26-04-29 08:02:01.453455 - 6:44:30 - step: 16840 acc: 0 loss: 1.7207 grad: 1.49e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.638 data: 0.0516 lr: 4.93e-05 mem: 47% pow: 649.666 W 0: INFO 26-04-29 08:02:15.229010 - 6:44:43 - step: 16850 acc: 0 loss: 1.7949 grad: 1.76e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6099 data: 0.0716 lr: 4.93e-05 mem: 47% pow: 648.314 W 0: INFO 26-04-29 08:02:29.403927 - 6:44:57 - step: 16860 acc: 0 loss: 1.6403 grad: 1.60e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6612 data: 0.0706 lr: 4.93e-05 mem: 47% pow: 619.467 W 0: INFO 26-04-29 08:02:43.258765 - 6:45:11 - step: 16870 acc: 0 loss: 1.4487 grad: 1.61e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6199 data: 0.065 lr: 4.93e-05 mem: 47% pow: 653.378 W 0: INFO 26-04-29 08:02:57.116651 - 6:45:25 - step: 16880 acc: 0 loss: 1.6359 grad: 1.67e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6445 data: 0.0349 lr: 4.93e-05 mem: 47% pow: 653.768 W 0: INFO 26-04-29 08:03:10.913443 - 6:45:39 - step: 16890 acc: 0 loss: 1.3575 grad: 1.66e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6455 data: 0.0699 lr: 4.93e-05 mem: 47% pow: 640.967 W 0: INFO 26-04-29 08:03:24.931761 - 6:45:53 - step: 16900 acc: 0 loss: 1.5329 grad: 3.08e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6045 data: 0.1083 lr: 4.93e-05 mem: 47% pow: 636.252 W 0: INFO 26-04-29 08:03:41.759496 - 6:46:10 - step: 16910 acc: 0 loss: 1.5995 grad: 1.69e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.5868 data: 0.0951 lr: 4.92e-05 mem: 54% pow: 657.677 W 0: INFO 26-04-29 08:03:55.562049 - 6:46:24 - step: 16920 acc: 0 loss: 1.5334 grad: 1.52e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6473 data: 0.0597 lr: 4.92e-05 mem: 47% pow: 638.939 W 0: INFO 26-04-29 08:04:09.115067 - 6:46:37 - step: 16930 acc: 0 loss: 1.8158 grad: 1.87e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6089 data: 0.0746 lr: 4.92e-05 mem: 47% pow: 654.464 W 0: INFO 26-04-29 08:04:23.122835 - 6:46:51 - step: 16940 acc: 0 loss: 1.8303 grad: 1.43e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6183 data: 0.0721 lr: 4.92e-05 mem: 47% pow: 653.606 W 0: INFO 26-04-29 08:04:36.678314 - 6:47:05 - step: 16950 acc: 0 loss: 1.5251 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6142 data: 0.071 lr: 4.92e-05 mem: 47% pow: 662.46 W 0: INFO 26-04-29 08:04:50.450686 - 6:47:19 - step: 16960 acc: 0 loss: 1.4965 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.617 data: 0.0723 lr: 4.92e-05 mem: 47% pow: 655.618 W 0: INFO 26-04-29 08:05:04.597302 - 6:47:33 - step: 16970 acc: 0 loss: 1.4629 grad: 1.78e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6154 data: 0.0664 lr: 4.92e-05 mem: 47% pow: 654.716 W 0: INFO 26-04-29 08:05:19.025053 - 6:47:47 - step: 16980 acc: 0 loss: 1.4822 grad: 1.47e-01 flops: 3.92e+14 wps: 4.54e+04 iter: 0.6249 data: 0.0695 lr: 4.91e-05 mem: 47% pow: 646.097 W 0: INFO 26-04-29 08:05:33.043533 - 6:48:01 - step: 16990 acc: 0 loss: 1.3887 grad: 1.52e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.597 data: 0.0871 lr: 4.91e-05 mem: 47% pow: 655.872 W 0: INFO 26-04-29 08:05:47.199536 - 6:48:15 - step: 17000 acc: 0 loss: 1.0922 grad: 1.47e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.616 data: 0.0661 lr: 4.91e-05 mem: 47% pow: 651.107 W 0: INFO 26-04-29 08:05:50.924979 - 6:48:19 - garbage collection 0: INFO 26-04-29 08:06:05.574893 - 6:48:34 - step: 17010 acc: 0 loss: 1.3114 grad: 1.67e-01 flops: 3.07e+14 wps: 3.57e+04 iter: 0.6128 data: 0.0645 lr: 4.91e-05 mem: 54% pow: 646.541 W 0: INFO 26-04-29 08:06:19.443752 - 6:48:48 - step: 17020 acc: 0 loss: 1.4927 grad: 1.58e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6732 data: 0.0674 lr: 4.91e-05 mem: 47% pow: 615.981 W 0: INFO 26-04-29 08:06:33.362358 - 6:49:01 - step: 17030 acc: 0 loss: 1.4618 grad: 1.49e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6431 data: 0.0666 lr: 4.91e-05 mem: 47% pow: 638.094 W 0: INFO 26-04-29 08:06:47.357794 - 6:49:15 - step: 17040 acc: 0 loss: 1.3691 grad: 1.51e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6322 data: 0.0675 lr: 4.90e-05 mem: 47% pow: 644.118 W 0: INFO 26-04-29 08:07:01.172907 - 6:49:29 - step: 17050 acc: 0 loss: 1.3664 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.646 data: 0.0399 lr: 4.90e-05 mem: 47% pow: 657.735 W 0: INFO 26-04-29 08:07:14.870527 - 6:49:43 - step: 17060 acc: 0 loss: 1.4892 grad: 1.54e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6385 data: 0.0595 lr: 4.90e-05 mem: 47% pow: 650.226 W 0: INFO 26-04-29 08:07:28.512231 - 6:49:57 - step: 17070 acc: 0 loss: 1.2381 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6341 data: 0.0636 lr: 4.90e-05 mem: 47% pow: 656.114 W 0: INFO 26-04-29 08:07:42.199262 - 6:50:10 - step: 17080 acc: 0 loss: 1.2027 grad: 1.75e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6434 data: 0.0596 lr: 4.90e-05 mem: 47% pow: 645.77 W 0: INFO 26-04-29 08:07:56.205072 - 6:50:24 - step: 17090 acc: 0 loss: 1.2888 grad: 1.48e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6597 data: 0.0334 lr: 4.90e-05 mem: 47% pow: 644.309 W 0: INFO 26-04-29 08:08:09.801926 - 6:50:38 - step: 17100 acc: 0 loss: 1.4814 grad: 1.51e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.609 data: 0.0694 lr: 4.90e-05 mem: 47% pow: 657.909 W 0: INFO 26-04-29 08:08:26.502164 - 6:50:55 - step: 17110 acc: 0 loss: 1.5281 grad: 1.57e-01 flops: 3.38e+14 wps: 3.93e+04 iter: 0.622 data: 0.0665 lr: 4.89e-05 mem: 54% pow: 652.481 W 0: INFO 26-04-29 08:08:40.356364 - 6:51:08 - step: 17120 acc: 0 loss: 1.8558 grad: 1.50e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.607 data: 0.0706 lr: 4.89e-05 mem: 47% pow: 652.524 W 0: INFO 26-04-29 08:08:54.230217 - 6:51:22 - step: 17130 acc: 0 loss: 1.2855 grad: 1.63e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6291 data: 0.0658 lr: 4.89e-05 mem: 47% pow: 650.266 W 0: INFO 26-04-29 08:09:08.315416 - 6:51:36 - step: 17140 acc: 0 loss: 1.4272 grad: 1.51e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.8422 data: 0.0027 lr: 4.89e-05 mem: 47% pow: 559.435 W 0: INFO 26-04-29 08:09:21.859780 - 6:51:50 - step: 17150 acc: 0 loss: 1.6521 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6181 data: 0.0706 lr: 4.89e-05 mem: 47% pow: 656.382 W 0: INFO 26-04-29 08:09:35.751507 - 6:52:04 - step: 17160 acc: 0 loss: 1.2233 grad: 1.50e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5923 data: 0.0759 lr: 4.89e-05 mem: 47% pow: 668.157 W 0: INFO 26-04-29 08:09:49.397429 - 6:52:17 - step: 17170 acc: 0 loss: 1.5677 grad: 1.45e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6323 data: 0.0723 lr: 4.89e-05 mem: 47% pow: 642.466 W 0: INFO 26-04-29 08:10:03.121063 - 6:52:31 - step: 17180 acc: 0 loss: 1.4637 grad: 1.84e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.654 data: 0.0755 lr: 4.88e-05 mem: 47% pow: 627.591 W 0: INFO 26-04-29 08:10:16.816913 - 6:52:45 - step: 17190 acc: 0 loss: 1.2264 grad: 1.66e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6453 data: 0.0773 lr: 4.88e-05 mem: 47% pow: 629.957 W 0: INFO 26-04-29 08:10:30.953749 - 6:52:59 - step: 17200 acc: 0 loss: 1.1656 grad: 1.61e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6515 data: 0.0668 lr: 4.88e-05 mem: 47% pow: 632.833 W 0: INFO 26-04-29 08:10:47.840924 - 6:53:16 - step: 17210 acc: 0 loss: 1.3203 grad: 1.65e-01 flops: 3.35e+14 wps: 3.88e+04 iter: 0.5896 data: 0.0943 lr: 4.88e-05 mem: 54% pow: 654.957 W 0: INFO 26-04-29 08:11:01.455972 - 6:53:30 - step: 17220 acc: 0 loss: 1.4363 grad: 1.47e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6227 data: 0.0774 lr: 4.88e-05 mem: 47% pow: 655.323 W 0: INFO 26-04-29 08:11:15.369532 - 6:53:43 - step: 17230 acc: 0 loss: 1.4397 grad: 1.42e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.655 data: 0.0584 lr: 4.88e-05 mem: 47% pow: 636.148 W 0: INFO 26-04-29 08:11:29.384180 - 6:53:57 - step: 17240 acc: 0 loss: 1.3753 grad: 1.56e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6296 data: 0.0721 lr: 4.87e-05 mem: 47% pow: 665.426 W 0: INFO 26-04-29 08:11:45.504979 - 6:54:14 - step: 17250 acc: 0 loss: 1.7634 grad: 1.51e-01 flops: 3.50e+14 wps: 4.07e+04 iter: 0.7069 data: 0.066 lr: 4.87e-05 mem: 47% pow: 600.613 W 0: INFO 26-04-29 08:11:59.177836 - 6:54:27 - step: 17260 acc: 0 loss: 1.5333 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6154 data: 0.0695 lr: 4.87e-05 mem: 47% pow: 650.446 W 0: INFO 26-04-29 08:12:13.136653 - 6:54:41 - step: 17270 acc: 0 loss: 1.8228 grad: 1.62e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6126 data: 0.0739 lr: 4.87e-05 mem: 47% pow: 654.663 W 0: INFO 26-04-29 08:12:26.895313 - 6:54:55 - step: 17280 acc: 0 loss: 1.8884 grad: 1.63e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6038 data: 0.0712 lr: 4.87e-05 mem: 47% pow: 660.507 W 0: INFO 26-04-29 08:12:40.870055 - 6:55:09 - step: 17290 acc: 0 loss: 1.4364 grad: 1.62e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6594 data: 0.0699 lr: 4.87e-05 mem: 47% pow: 642.977 W 0: INFO 26-04-29 08:12:54.701084 - 6:55:23 - step: 17300 acc: 0 loss: 1.7288 grad: 1.91e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6491 data: 0.0676 lr: 4.87e-05 mem: 47% pow: 631.32 W 0: INFO 26-04-29 08:13:11.469974 - 6:55:40 - step: 17310 acc: 0 loss: 1.3715 grad: 1.46e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.7004 data: 0.0713 lr: 4.86e-05 mem: 54% pow: 604.389 W 0: INFO 26-04-29 08:13:25.228641 - 6:55:53 - step: 17320 acc: 0 loss: 1.5697 grad: 1.45e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6721 data: 0.0574 lr: 4.86e-05 mem: 47% pow: 630.412 W 0: INFO 26-04-29 08:13:38.800503 - 6:56:07 - step: 17330 acc: 0 loss: 1.4 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6172 data: 0.0721 lr: 4.86e-05 mem: 47% pow: 655.151 W 0: INFO 26-04-29 08:13:52.803308 - 6:56:21 - step: 17340 acc: 0 loss: 1.321 grad: 1.46e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6085 data: 0.0696 lr: 4.86e-05 mem: 47% pow: 676.856 W 0: INFO 26-04-29 08:14:06.741781 - 6:56:35 - step: 17350 acc: 0 loss: 1.4095 grad: 1.49e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6367 data: 0.0666 lr: 4.86e-05 mem: 47% pow: 639.226 W 0: INFO 26-04-29 08:14:20.955085 - 6:56:49 - step: 17360 acc: 0 loss: 1.6305 grad: 1.57e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6475 data: 0.0677 lr: 4.86e-05 mem: 47% pow: 646.211 W 0: INFO 26-04-29 08:14:34.975421 - 6:57:03 - step: 17370 acc: 0 loss: 1.4003 grad: 1.55e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6155 data: 0.0791 lr: 4.86e-05 mem: 47% pow: 649.573 W 0: INFO 26-04-29 08:14:48.833754 - 6:57:17 - step: 17380 acc: 0 loss: 1.2833 grad: 1.49e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6283 data: 0.0679 lr: 4.85e-05 mem: 47% pow: 645.895 W 0: INFO 26-04-29 08:15:02.913905 - 6:57:31 - step: 17390 acc: 0 loss: 1.378 grad: 1.50e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6599 data: 0.0546 lr: 4.85e-05 mem: 47% pow: 635.797 W 0: INFO 26-04-29 08:15:16.841860 - 6:57:45 - step: 17400 acc: 0 loss: 1.5882 grad: 1.50e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6892 data: 0.0715 lr: 4.85e-05 mem: 47% pow: 606.947 W 0: INFO 26-04-29 08:15:33.623406 - 6:58:02 - step: 17410 acc: 0 loss: 1.4983 grad: 1.73e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6401 data: 0.0691 lr: 4.85e-05 mem: 54% pow: 644.442 W 0: INFO 26-04-29 08:15:47.741760 - 6:58:16 - step: 17420 acc: 0 loss: 1.4799 grad: 1.74e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5972 data: 0.0738 lr: 4.85e-05 mem: 47% pow: 665.373 W 0: INFO 26-04-29 08:16:01.921411 - 6:58:30 - step: 17430 acc: 0 loss: 1.9353 grad: 1.59e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6423 data: 0.0677 lr: 4.85e-05 mem: 47% pow: 645.89 W 0: INFO 26-04-29 08:16:18.429816 - 6:58:47 - step: 17440 acc: 0 loss: 1.5009 grad: 1.65e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.628 data: 0.0674 lr: 4.85e-05 mem: 47% pow: 652.368 W 0: INFO 26-04-29 08:16:32.498067 - 6:59:01 - step: 17450 acc: 0 loss: 1.1201 grad: 1.54e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6763 data: 0.0703 lr: 4.84e-05 mem: 47% pow: 621.268 W 0: INFO 26-04-29 08:16:46.441453 - 6:59:15 - step: 17460 acc: 0 loss: 1.4351 grad: 1.59e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6932 data: 0.0329 lr: 4.84e-05 mem: 47% pow: 639.089 W 0: INFO 26-04-29 08:17:00.331300 - 6:59:28 - step: 17470 acc: 0 loss: 1.556 grad: 1.66e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6344 data: 0.0649 lr: 4.84e-05 mem: 47% pow: 644.467 W 0: INFO 26-04-29 08:17:13.943087 - 6:59:42 - step: 17480 acc: 0 loss: 1.7472 grad: 1.62e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6154 data: 0.0692 lr: 4.84e-05 mem: 47% pow: 647.37 W 0: INFO 26-04-29 08:17:27.851187 - 6:59:56 - step: 17490 acc: 0 loss: 1.6899 grad: 1.62e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6235 data: 0.0701 lr: 4.84e-05 mem: 47% pow: 652.829 W 0: INFO 26-04-29 08:17:42.042022 - 7:00:10 - step: 17500 acc: 0 loss: 1.4794 grad: 1.48e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.667 data: 0.0631 lr: 4.84e-05 mem: 47% pow: 625.408 W 0: INFO 26-04-29 08:17:58.671916 - 7:00:27 - step: 17510 acc: 0 loss: 1.2702 grad: 1.67e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6157 data: 0.0651 lr: 4.83e-05 mem: 54% pow: 653.983 W 0: INFO 26-04-29 08:18:12.468142 - 7:00:41 - step: 17520 acc: 0 loss: 1.7705 grad: 1.68e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6473 data: 0.0752 lr: 4.83e-05 mem: 47% pow: 626.754 W 0: INFO 26-04-29 08:18:26.355180 - 7:00:54 - step: 17530 acc: 0 loss: 1.6732 grad: 1.56e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.648 data: 0.071 lr: 4.83e-05 mem: 47% pow: 623.992 W 0: INFO 26-04-29 08:18:40.468152 - 7:01:09 - step: 17540 acc: 0 loss: 1.4274 grad: 1.54e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.627 data: 0.0674 lr: 4.83e-05 mem: 47% pow: 658.593 W 0: INFO 26-04-29 08:18:54.487416 - 7:01:23 - step: 17550 acc: 0 loss: 1.7198 grad: 1.88e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6242 data: 0.0711 lr: 4.83e-05 mem: 47% pow: 644.651 W 0: INFO 26-04-29 08:19:08.360508 - 7:01:36 - step: 17560 acc: 0 loss: 1.2247 grad: 1.53e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6328 data: 0.0923 lr: 4.83e-05 mem: 47% pow: 641.93 W 0: INFO 26-04-29 08:19:24.940201 - 7:01:53 - step: 17570 acc: 0 loss: 1.619 grad: 1.50e-01 flops: 3.41e+14 wps: 3.95e+04 iter: 0.6772 data: 0.0482 lr: 4.83e-05 mem: 47% pow: 622.318 W 0: INFO 26-04-29 08:19:38.941857 - 7:02:07 - step: 17580 acc: 0 loss: 1.4408 grad: 1.51e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6705 data: 0.0727 lr: 4.82e-05 mem: 47% pow: 616.864 W 0: INFO 26-04-29 08:19:52.549763 - 7:02:21 - step: 17590 acc: 0 loss: 1.3256 grad: 1.63e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6006 data: 0.0773 lr: 4.82e-05 mem: 47% pow: 651.471 W 0: INFO 26-04-29 08:20:06.445257 - 7:02:35 - step: 17600 acc: 0 loss: 1.4492 grad: 1.50e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6115 data: 0.0694 lr: 4.82e-05 mem: 47% pow: 644.111 W 0: INFO 26-04-29 08:20:23.387926 - 7:02:51 - step: 17610 acc: 0 loss: 1.3594 grad: 1.49e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.6679 data: 0.0665 lr: 4.82e-05 mem: 54% pow: 624.463 W 0: INFO 26-04-29 08:20:37.118113 - 7:03:05 - step: 17620 acc: 0 loss: 1.5583 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5996 data: 0.083 lr: 4.82e-05 mem: 47% pow: 658.061 W 0: INFO 26-04-29 08:20:50.980887 - 7:03:19 - step: 17630 acc: 0 loss: 1.3324 grad: 1.55e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.7518 data: 0.0683 lr: 4.82e-05 mem: 47% pow: 593.431 W 0: INFO 26-04-29 08:21:05.098024 - 7:03:33 - step: 17640 acc: 0 loss: 1.0516 grad: 1.54e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.7832 data: 0.0775 lr: 4.82e-05 mem: 47% pow: 547.703 W 0: INFO 26-04-29 08:21:19.251706 - 7:03:47 - step: 17650 acc: 0 loss: 1.5043 grad: 1.48e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6092 data: 0.0926 lr: 4.81e-05 mem: 47% pow: 637.004 W 0: INFO 26-04-29 08:21:32.778840 - 7:04:01 - step: 17660 acc: 0 loss: 1.4229 grad: 1.47e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5999 data: 0.0816 lr: 4.81e-05 mem: 47% pow: 653.243 W 0: INFO 26-04-29 08:21:46.639554 - 7:04:15 - step: 17670 acc: 0 loss: 1.3583 grad: 1.52e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6377 data: 0.0675 lr: 4.81e-05 mem: 47% pow: 641.328 W 0: INFO 26-04-29 08:22:00.577661 - 7:04:29 - step: 17680 acc: 0 loss: 1.3999 grad: 1.49e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6179 data: 0.0686 lr: 4.81e-05 mem: 47% pow: 649.359 W 0: INFO 26-04-29 08:22:14.696936 - 7:04:43 - step: 17690 acc: 0 loss: 1.2618 grad: 1.48e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6458 data: 0.0662 lr: 4.81e-05 mem: 47% pow: 643.986 W 0: INFO 26-04-29 08:22:28.389706 - 7:04:56 - step: 17700 acc: 0 loss: 1.2848 grad: 1.53e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6097 data: 0.0872 lr: 4.81e-05 mem: 47% pow: 642.505 W 0: INFO 26-04-29 08:22:45.039827 - 7:05:13 - step: 17710 acc: 0 loss: 1.4061 grad: 1.46e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6133 data: 0.0671 lr: 4.80e-05 mem: 54% pow: 650.187 W 0: INFO 26-04-29 08:22:58.842416 - 7:05:27 - step: 17720 acc: 0 loss: 1.6164 grad: 1.55e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6186 data: 0.0718 lr: 4.80e-05 mem: 47% pow: 647.611 W 0: INFO 26-04-29 08:23:12.539380 - 7:05:41 - step: 17730 acc: 0 loss: 1.4676 grad: 1.52e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.664 data: 0.0609 lr: 4.80e-05 mem: 47% pow: 627.209 W 0: INFO 26-04-29 08:23:26.580029 - 7:05:55 - step: 17740 acc: 0 loss: 1.817 grad: 1.69e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6555 data: 0.0726 lr: 4.80e-05 mem: 47% pow: 629.326 W 0: INFO 26-04-29 08:23:40.312620 - 7:06:08 - step: 17750 acc: 0 loss: 1.1304 grad: 1.54e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6163 data: 0.0716 lr: 4.80e-05 mem: 47% pow: 649.317 W 0: INFO 26-04-29 08:23:54.417498 - 7:06:23 - step: 17760 acc: 0 loss: 1.7298 grad: 1.59e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6056 data: 0.0773 lr: 4.80e-05 mem: 47% pow: 656.359 W 0: INFO 26-04-29 08:24:08.502349 - 7:06:37 - step: 17770 acc: 0 loss: 1.3318 grad: 1.54e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6374 data: 0.054 lr: 4.80e-05 mem: 47% pow: 652.197 W 0: INFO 26-04-29 08:24:22.197806 - 7:06:50 - step: 17780 acc: 0 loss: 1.655 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6243 data: 0.0669 lr: 4.79e-05 mem: 47% pow: 652.596 W 0: INFO 26-04-29 08:24:36.445883 - 7:07:05 - step: 17790 acc: 0 loss: 1.664 grad: 1.50e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6342 data: 0.0615 lr: 4.79e-05 mem: 47% pow: 639.367 W 0: INFO 26-04-29 08:24:50.317059 - 7:07:18 - step: 17800 acc: 0 loss: 1.6989 grad: 1.53e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6316 data: 0.0686 lr: 4.79e-05 mem: 47% pow: 642.92 W 0: INFO 26-04-29 08:25:06.929152 - 7:07:35 - step: 17810 acc: 0 loss: 1.3686 grad: 1.48e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6533 data: 0.0622 lr: 4.79e-05 mem: 54% pow: 643.888 W 0: INFO 26-04-29 08:25:20.555740 - 7:07:49 - step: 17820 acc: 0 loss: 1.4471 grad: 1.47e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6174 data: 0.0714 lr: 4.79e-05 mem: 47% pow: 665.102 W 0: INFO 26-04-29 08:25:34.199843 - 7:08:02 - step: 17830 acc: 0 loss: 1.4828 grad: 1.66e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.7016 data: 0.0653 lr: 4.79e-05 mem: 47% pow: 605.754 W 0: INFO 26-04-29 08:25:47.885129 - 7:08:16 - step: 17840 acc: 0 loss: 1.4432 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6114 data: 0.0699 lr: 4.79e-05 mem: 47% pow: 654.28 W 0: INFO 26-04-29 08:26:01.791456 - 7:08:30 - step: 17850 acc: 0 loss: 1.0558 grad: 1.58e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.618 data: 0.0593 lr: 4.78e-05 mem: 47% pow: 665.57 W 0: INFO 26-04-29 08:26:15.546410 - 7:08:44 - step: 17860 acc: 0 loss: 1.2788 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6255 data: 0.063 lr: 4.78e-05 mem: 47% pow: 656.167 W 0: INFO 26-04-29 08:26:29.453558 - 7:08:58 - step: 17870 acc: 0 loss: 1.4197 grad: 1.58e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.669 data: 0.0484 lr: 4.78e-05 mem: 47% pow: 629.082 W 0: INFO 26-04-29 08:26:43.375171 - 7:09:11 - step: 17880 acc: 0 loss: 1.691 grad: 1.48e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6122 data: 0.0682 lr: 4.78e-05 mem: 47% pow: 650.846 W 0: INFO 26-04-29 08:26:57.554423 - 7:09:26 - step: 17890 acc: 0 loss: 1.1985 grad: 1.49e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6734 data: 0.0648 lr: 4.78e-05 mem: 47% pow: 626.041 W 0: INFO 26-04-29 08:27:11.631892 - 7:09:40 - step: 17900 acc: 0 loss: 1.86 grad: 1.51e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6107 data: 0.0702 lr: 4.78e-05 mem: 47% pow: 653.679 W 0: INFO 26-04-29 08:27:31.594437 - 7:10:00 - step: 17910 acc: 0 loss: 1.602 grad: 1.47e-01 flops: 2.83e+14 wps: 3.28e+04 iter: 3.9577 data: 0.0789 lr: 4.78e-05 mem: 54% pow: 446.174 W 0: INFO 26-04-29 08:27:45.491755 - 7:10:14 - step: 17920 acc: 0 loss: 1.0832 grad: 1.46e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6168 data: 0.0822 lr: 4.77e-05 mem: 47% pow: 646.132 W 0: INFO 26-04-29 08:27:59.791902 - 7:10:28 - step: 17930 acc: 0 loss: 1.5041 grad: 1.54e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6753 data: 0.0604 lr: 4.77e-05 mem: 47% pow: 625.16 W 0: INFO 26-04-29 08:28:13.573107 - 7:10:42 - step: 17940 acc: 0 loss: 1.4339 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6523 data: 0.0661 lr: 4.77e-05 mem: 47% pow: 636.0 W 0: INFO 26-04-29 08:28:27.170987 - 7:10:55 - step: 17950 acc: 0 loss: 1.5556 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6115 data: 0.0679 lr: 4.77e-05 mem: 47% pow: 652.619 W 0: INFO 26-04-29 08:28:40.811446 - 7:11:09 - step: 17960 acc: 0 loss: 1.4025 grad: 1.42e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6289 data: 0.0643 lr: 4.77e-05 mem: 47% pow: 643.123 W 0: INFO 26-04-29 08:28:54.778900 - 7:11:23 - step: 17970 acc: 0 loss: 1.6257 grad: 1.43e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6079 data: 0.0703 lr: 4.77e-05 mem: 47% pow: 659.495 W 0: INFO 26-04-29 08:29:10.207920 - 7:11:38 - step: 17980 acc: 0 loss: 1.415 grad: 1.50e-01 flops: 3.66e+14 wps: 4.25e+04 iter: 0.6292 data: 0.0659 lr: 4.76e-05 mem: 47% pow: 638.856 W 0: INFO 26-04-29 08:29:24.873424 - 7:11:53 - step: 17990 acc: 0 loss: 1.5047 grad: 1.49e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6202 data: 0.0806 lr: 4.76e-05 mem: 47% pow: 653.935 W 0: INFO 26-04-29 08:29:38.472362 - 7:12:07 - step: 18000 acc: 0 loss: 1.2657 grad: 1.69e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6483 data: 0.0273 lr: 4.76e-05 mem: 47% pow: 658.056 W 0: INFO 26-04-29 08:29:42.157260 - 7:12:10 - garbage collection 0: INFO 26-04-29 08:29:57.031660 - 7:12:25 - step: 18010 acc: 0 loss: 1.2543 grad: 1.41e-01 flops: 3.04e+14 wps: 3.53e+04 iter: 0.634 data: 0.1003 lr: 4.76e-05 mem: 54% pow: 619.675 W 0: INFO 26-04-29 08:30:10.809541 - 7:12:39 - step: 18020 acc: 0 loss: 1.6871 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6133 data: 0.064 lr: 4.76e-05 mem: 47% pow: 662.617 W 0: INFO 26-04-29 08:30:24.710946 - 7:12:53 - step: 18030 acc: 0 loss: 1.2202 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6368 data: 0.0662 lr: 4.76e-05 mem: 47% pow: 641.115 W 0: INFO 26-04-29 08:30:38.612037 - 7:13:07 - step: 18040 acc: 0 loss: 1.7266 grad: 2.70e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6129 data: 0.1 lr: 4.76e-05 mem: 47% pow: 638.297 W 0: INFO 26-04-29 08:30:52.584192 - 7:13:21 - step: 18050 acc: 0 loss: 1.1613 grad: 1.52e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6514 data: 0.0391 lr: 4.75e-05 mem: 47% pow: 651.117 W 0: INFO 26-04-29 08:31:07.083359 - 7:13:35 - step: 18060 acc: 0 loss: 1.6486 grad: 1.52e-01 flops: 3.90e+14 wps: 4.52e+04 iter: 0.6236 data: 0.063 lr: 4.75e-05 mem: 47% pow: 657.2 W 0: INFO 26-04-29 08:31:20.912433 - 7:13:49 - step: 18070 acc: 0 loss: 1.3655 grad: 1.53e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6107 data: 0.0689 lr: 4.75e-05 mem: 47% pow: 647.881 W 0: INFO 26-04-29 08:31:35.826430 - 7:14:04 - step: 18080 acc: 0 loss: 1.4074 grad: 1.50e-01 flops: 3.79e+14 wps: 4.39e+04 iter: 1.1814 data: 0.0711 lr: 4.75e-05 mem: 47% pow: 420.129 W 0: INFO 26-04-29 08:31:51.502148 - 7:14:20 - step: 18090 acc: 0 loss: 1.6606 grad: 1.51e-01 flops: 3.60e+14 wps: 4.18e+04 iter: 0.7304 data: 0.0216 lr: 4.75e-05 mem: 47% pow: 615.067 W 0: INFO 26-04-29 08:32:05.483508 - 7:14:34 - step: 18100 acc: 0 loss: 1.4189 grad: 1.64e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6113 data: 0.0713 lr: 4.75e-05 mem: 47% pow: 647.013 W 0: INFO 26-04-29 08:32:22.813593 - 7:14:51 - step: 18110 acc: 0 loss: 1.542 grad: 1.53e-01 flops: 3.26e+14 wps: 3.78e+04 iter: 0.6294 data: 0.0687 lr: 4.75e-05 mem: 54% pow: 645.128 W 0: INFO 26-04-29 08:32:37.391715 - 7:15:05 - step: 18120 acc: 0 loss: 1.4028 grad: 1.46e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6702 data: 0.0653 lr: 4.74e-05 mem: 47% pow: 622.762 W 0: INFO 26-04-29 08:32:50.941649 - 7:15:19 - step: 18130 acc: 0 loss: 1.6127 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6199 data: 0.0704 lr: 4.74e-05 mem: 47% pow: 654.36 W 0: INFO 26-04-29 08:33:06.145522 - 7:15:34 - step: 18140 acc: 0 loss: 1.4282 grad: 1.50e-01 flops: 3.72e+14 wps: 4.31e+04 iter: 0.6402 data: 0.0648 lr: 4.74e-05 mem: 47% pow: 644.753 W 0: INFO 26-04-29 08:33:20.122686 - 7:15:48 - step: 18150 acc: 0 loss: 1.4806 grad: 1.57e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6709 data: 0.0714 lr: 4.74e-05 mem: 47% pow: 617.993 W 0: INFO 26-04-29 08:33:33.959312 - 7:16:02 - step: 18160 acc: 0 loss: 1.3986 grad: 1.48e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7117 data: 0.0725 lr: 4.74e-05 mem: 47% pow: 593.47 W 0: INFO 26-04-29 08:33:54.628960 - 7:16:23 - step: 18170 acc: 0 loss: 1.2678 grad: 1.46e-01 flops: 2.73e+14 wps: 3.17e+04 iter: 0.802 data: 0.0695 lr: 4.74e-05 mem: 47% pow: 553.358 W 0: INFO 26-04-29 08:34:08.436118 - 7:16:37 - step: 18180 acc: 0 loss: 1.386 grad: 1.47e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6185 data: 0.0756 lr: 4.73e-05 mem: 47% pow: 648.977 W 0: INFO 26-04-29 08:34:23.196967 - 7:16:51 - step: 18190 acc: 0 loss: 1.3335 grad: 1.55e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.635 data: 0.0677 lr: 4.73e-05 mem: 47% pow: 641.533 W 0: INFO 26-04-29 08:34:37.959183 - 7:17:06 - step: 18200 acc: 0 loss: 1.3758 grad: 1.48e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.5931 data: 0.0727 lr: 4.73e-05 mem: 47% pow: 662.329 W 0: INFO 26-04-29 08:34:54.923938 - 7:17:23 - step: 18210 acc: 0 loss: 1.333 grad: 1.62e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 0.6523 data: 0.0734 lr: 4.73e-05 mem: 54% pow: 631.733 W 0: INFO 26-04-29 08:35:08.664801 - 7:17:37 - step: 18220 acc: 0 loss: 1.2441 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6511 data: 0.0625 lr: 4.73e-05 mem: 47% pow: 640.588 W 0: INFO 26-04-29 08:35:23.162682 - 7:17:51 - step: 18230 acc: 0 loss: 1.3654 grad: 1.47e-01 flops: 3.90e+14 wps: 4.52e+04 iter: 0.7595 data: 0.0647 lr: 4.73e-05 mem: 47% pow: 582.048 W 0: INFO 26-04-29 08:35:39.697012 - 7:18:08 - step: 18240 acc: 0 loss: 1.3289 grad: 1.48e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.63 data: 0.0725 lr: 4.73e-05 mem: 47% pow: 643.675 W 0: INFO 26-04-29 08:35:58.623456 - 7:18:27 - step: 18250 acc: 0 loss: 1.3804 grad: 1.51e-01 flops: 2.98e+14 wps: 3.46e+04 iter: 0.7242 data: 0.0775 lr: 4.72e-05 mem: 47% pow: 594.553 W 0: INFO 26-04-29 08:36:12.790781 - 7:18:41 - step: 18260 acc: 0 loss: 1.1795 grad: 1.49e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6275 data: 0.0671 lr: 4.72e-05 mem: 47% pow: 650.385 W 0: INFO 26-04-29 08:36:26.747996 - 7:18:55 - step: 18270 acc: 0 loss: 1.4416 grad: 1.48e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6115 data: 0.075 lr: 4.72e-05 mem: 47% pow: 648.27 W 0: INFO 26-04-29 08:36:40.833374 - 7:19:09 - step: 18280 acc: 0 loss: 1.4179 grad: 1.52e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6065 data: 0.0766 lr: 4.72e-05 mem: 47% pow: 654.974 W 0: INFO 26-04-29 08:36:54.799475 - 7:19:23 - step: 18290 acc: 0 loss: 1.4513 grad: 1.46e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6307 data: 0.0764 lr: 4.72e-05 mem: 47% pow: 653.734 W 0: INFO 26-04-29 08:37:08.630485 - 7:19:37 - step: 18300 acc: 0 loss: 1.4987 grad: 1.55e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6066 data: 0.0733 lr: 4.72e-05 mem: 47% pow: 654.969 W 0: INFO 26-04-29 08:37:25.503672 - 7:19:54 - step: 18310 acc: 0 loss: 1.2047 grad: 1.57e-01 flops: 3.35e+14 wps: 3.88e+04 iter: 0.6161 data: 0.077 lr: 4.72e-05 mem: 54% pow: 648.333 W 0: INFO 26-04-29 08:37:48.178574 - 7:20:16 - step: 18320 acc: 0 loss: 1.4541 grad: 1.61e-01 flops: 2.49e+14 wps: 2.89e+04 iter: 0.6727 data: 0.0738 lr: 4.71e-05 mem: 47% pow: 628.487 W 0: INFO 26-04-29 08:38:02.929148 - 7:20:31 - step: 18330 acc: 0 loss: 1.2825 grad: 1.62e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.621 data: 0.0766 lr: 4.71e-05 mem: 47% pow: 645.904 W 0: INFO 26-04-29 08:38:19.406448 - 7:20:47 - step: 18340 acc: 0 loss: 1.4159 grad: 1.50e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.6233 data: 0.0865 lr: 4.71e-05 mem: 47% pow: 640.382 W 0: INFO 26-04-29 08:38:33.454498 - 7:21:02 - step: 18350 acc: 0 loss: 1.2843 grad: 1.57e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6517 data: 0.066 lr: 4.71e-05 mem: 47% pow: 628.474 W 0: INFO 26-04-29 08:38:48.622257 - 7:21:17 - step: 18360 acc: 0 loss: 1.4456 grad: 1.49e-01 flops: 3.72e+14 wps: 4.32e+04 iter: 0.698 data: 0.0726 lr: 4.71e-05 mem: 47% pow: 601.785 W 0: INFO 26-04-29 08:39:03.394535 - 7:21:31 - step: 18370 acc: 0 loss: 1.4139 grad: 1.52e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.8693 data: 0.0675 lr: 4.71e-05 mem: 47% pow: 503.516 W 0: INFO 26-04-29 08:39:17.503363 - 7:21:46 - step: 18380 acc: 0 loss: 1.638 grad: 1.47e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6013 data: 0.0696 lr: 4.71e-05 mem: 47% pow: 661.827 W 0: INFO 26-04-29 08:39:33.151265 - 7:22:01 - step: 18390 acc: 0 loss: 1.3044 grad: 1.47e-01 flops: 3.61e+14 wps: 4.19e+04 iter: 0.6545 data: 0.0657 lr: 4.70e-05 mem: 47% pow: 625.439 W 0: INFO 26-04-29 08:39:47.161130 - 7:22:15 - step: 18400 acc: 0 loss: 1.3143 grad: 1.53e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6917 data: 0.072 lr: 4.70e-05 mem: 47% pow: 602.481 W 0: INFO 26-04-29 08:40:04.063865 - 7:22:32 - step: 18410 acc: 0 loss: 1.6973 grad: 1.50e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6595 data: 0.0683 lr: 4.70e-05 mem: 54% pow: 627.366 W 0: INFO 26-04-29 08:40:18.799321 - 7:22:47 - step: 18420 acc: 0 loss: 1.2807 grad: 1.45e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.703 data: 0.067 lr: 4.70e-05 mem: 47% pow: 603.111 W 0: INFO 26-04-29 08:40:32.793861 - 7:23:01 - step: 18430 acc: 0 loss: 1.752 grad: 1.51e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6481 data: 0.0698 lr: 4.70e-05 mem: 47% pow: 629.84 W 0: INFO 26-04-29 08:40:47.249392 - 7:23:15 - step: 18440 acc: 0 loss: 1.5822 grad: 1.62e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6808 data: 0.046 lr: 4.70e-05 mem: 47% pow: 638.41 W 0: INFO 26-04-29 08:41:01.256744 - 7:23:29 - step: 18450 acc: 0 loss: 1.3449 grad: 1.54e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6205 data: 0.0629 lr: 4.69e-05 mem: 47% pow: 654.809 W 0: INFO 26-04-29 08:41:15.442379 - 7:23:44 - step: 18460 acc: 0 loss: 1.4845 grad: 1.49e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6238 data: 0.0795 lr: 4.69e-05 mem: 47% pow: 638.327 W 0: INFO 26-04-29 08:41:31.388128 - 7:23:59 - step: 18470 acc: 0 loss: 1.4941 grad: 1.53e-01 flops: 3.54e+14 wps: 4.11e+04 iter: 1.0064 data: 0.0704 lr: 4.69e-05 mem: 47% pow: 440.288 W 0: INFO 26-04-29 08:41:45.386230 - 7:24:13 - step: 18480 acc: 0 loss: 1.5016 grad: 1.43e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6653 data: 0.0698 lr: 4.69e-05 mem: 47% pow: 621.432 W 0: INFO 26-04-29 08:42:03.446856 - 7:24:32 - step: 18490 acc: 0 loss: 1.3463 grad: 1.53e-01 flops: 3.13e+14 wps: 3.63e+04 iter: 0.6261 data: 0.0693 lr: 4.69e-05 mem: 47% pow: 644.622 W 0: INFO 26-04-29 08:42:17.463573 - 7:24:46 - step: 18500 acc: 0 loss: 1.4412 grad: 1.47e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6266 data: 0.0604 lr: 4.69e-05 mem: 47% pow: 657.05 W 0: INFO 26-04-29 08:42:34.748289 - 7:25:03 - step: 18510 acc: 0 loss: 1.3978 grad: 1.47e-01 flops: 3.27e+14 wps: 3.79e+04 iter: 0.6799 data: 0.0522 lr: 4.69e-05 mem: 54% pow: 632.465 W 0: INFO 26-04-29 08:42:49.325648 - 7:25:17 - step: 18520 acc: 0 loss: 1.5818 grad: 1.58e-01 flops: 3.87e+14 wps: 4.50e+04 iter: 0.6178 data: 0.0775 lr: 4.68e-05 mem: 47% pow: 645.598 W 0: INFO 26-04-29 08:43:03.980340 - 7:25:32 - step: 18530 acc: 0 loss: 1.1764 grad: 1.43e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6279 data: 0.0582 lr: 4.68e-05 mem: 47% pow: 657.961 W 0: INFO 26-04-29 08:43:19.980042 - 7:25:48 - step: 18540 acc: 0 loss: 1.5749 grad: 1.50e-01 flops: 3.53e+14 wps: 4.10e+04 iter: 0.6151 data: 0.0699 lr: 4.68e-05 mem: 47% pow: 648.309 W 0: INFO 26-04-29 08:43:33.996366 - 7:26:02 - step: 18550 acc: 0 loss: 1.4069 grad: 1.54e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.643 data: 0.0743 lr: 4.68e-05 mem: 47% pow: 632.327 W 0: INFO 26-04-29 08:43:48.812033 - 7:26:17 - step: 18560 acc: 0 loss: 1.6161 grad: 1.49e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.6887 data: 0.0494 lr: 4.68e-05 mem: 47% pow: 619.029 W 0: INFO 26-04-29 08:44:03.549835 - 7:26:32 - step: 18570 acc: 0 loss: 1.1687 grad: 1.45e-01 flops: 3.84e+14 wps: 4.45e+04 iter: 0.778 data: 0.0664 lr: 4.68e-05 mem: 47% pow: 565.107 W 0: INFO 26-04-29 08:44:18.712254 - 7:26:47 - step: 18580 acc: 0 loss: 1.4835 grad: 1.51e-01 flops: 3.73e+14 wps: 4.33e+04 iter: 0.6104 data: 0.0789 lr: 4.68e-05 mem: 47% pow: 651.353 W 0: INFO 26-04-29 08:44:36.041493 - 7:27:04 - step: 18590 acc: 0 loss: 1.5158 grad: 1.68e-01 flops: 3.26e+14 wps: 3.78e+04 iter: 0.6331 data: 0.0711 lr: 4.67e-05 mem: 47% pow: 634.142 W 0: INFO 26-04-29 08:44:50.623805 - 7:27:19 - step: 18600 acc: 0 loss: 1.4961 grad: 1.53e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.9022 data: 0.0702 lr: 4.67e-05 mem: 47% pow: 487.445 W 0: INFO 26-04-29 08:45:07.354075 - 7:27:35 - step: 18610 acc: 0 loss: 1.5645 grad: 1.46e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.6083 data: 0.0706 lr: 4.67e-05 mem: 54% pow: 653.11 W 0: INFO 26-04-29 08:45:21.604387 - 7:27:50 - step: 18620 acc: 0 loss: 1.747 grad: 1.48e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.7155 data: 0.0669 lr: 4.67e-05 mem: 47% pow: 596.867 W 0: INFO 26-04-29 08:45:35.981904 - 7:28:04 - step: 18630 acc: 0 loss: 1.4737 grad: 1.52e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6551 data: 0.0704 lr: 4.67e-05 mem: 47% pow: 629.253 W 0: INFO 26-04-29 08:45:50.069161 - 7:28:18 - step: 18640 acc: 0 loss: 1.3608 grad: 1.58e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6293 data: 0.0687 lr: 4.67e-05 mem: 47% pow: 644.545 W 0: INFO 26-04-29 08:46:06.490369 - 7:28:35 - step: 18650 acc: 0 loss: 1.2072 grad: 1.45e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.6469 data: 0.0755 lr: 4.67e-05 mem: 47% pow: 648.341 W 0: INFO 26-04-29 08:46:20.383198 - 7:28:48 - step: 18660 acc: 0 loss: 1.5724 grad: 1.45e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6092 data: 0.0802 lr: 4.66e-05 mem: 47% pow: 654.911 W 0: INFO 26-04-29 08:46:37.144633 - 7:29:05 - step: 18670 acc: 0 loss: 1.5407 grad: 1.52e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.7006 data: 0.0651 lr: 4.66e-05 mem: 47% pow: 607.656 W 0: INFO 26-04-29 08:46:54.304311 - 7:29:22 - step: 18680 acc: 0 loss: 1.4559 grad: 1.57e-01 flops: 3.29e+14 wps: 3.82e+04 iter: 0.6415 data: 0.0692 lr: 4.66e-05 mem: 47% pow: 643.104 W 0: INFO 26-04-29 08:47:08.342849 - 7:29:36 - step: 18690 acc: 0 loss: 1.5589 grad: 1.51e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6205 data: 0.0684 lr: 4.66e-05 mem: 47% pow: 650.574 W 0: INFO 26-04-29 08:47:25.222036 - 7:29:53 - step: 18700 acc: 0 loss: 1.3001 grad: 1.42e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 3.1442 data: 0.0669 lr: 4.66e-05 mem: 47% pow: 431.307 W 0: INFO 26-04-29 08:47:44.582659 - 7:30:13 - step: 18710 acc: 0 loss: 1.2669 grad: 1.49e-01 flops: 2.92e+14 wps: 3.39e+04 iter: 0.6061 data: 0.0777 lr: 4.66e-05 mem: 54% pow: 679.393 W 0: INFO 26-04-29 08:47:58.310892 - 7:30:26 - step: 18720 acc: 0 loss: 1.4651 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6027 data: 0.0745 lr: 4.65e-05 mem: 47% pow: 667.684 W 0: INFO 26-04-29 08:48:12.829706 - 7:30:41 - step: 18730 acc: 0 loss: 1.5798 grad: 1.53e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.6852 data: 0.0495 lr: 4.65e-05 mem: 47% pow: 637.374 W 0: INFO 26-04-29 08:48:26.890287 - 7:30:55 - step: 18740 acc: 0 loss: 1.3939 grad: 1.73e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6433 data: 0.0705 lr: 4.65e-05 mem: 47% pow: 635.041 W 0: INFO 26-04-29 08:48:42.170670 - 7:31:10 - step: 18750 acc: 0 loss: 1.5598 grad: 1.49e-01 flops: 3.70e+14 wps: 4.29e+04 iter: 0.6248 data: 0.0689 lr: 4.65e-05 mem: 47% pow: 651.346 W 0: INFO 26-04-29 08:48:56.012726 - 7:31:24 - step: 18760 acc: 0 loss: 1.2863 grad: 1.50e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7973 data: 0.073 lr: 4.65e-05 mem: 47% pow: 548.706 W 0: INFO 26-04-29 08:49:10.458771 - 7:31:39 - step: 18770 acc: 0 loss: 1.2766 grad: 1.51e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6112 data: 0.0745 lr: 4.65e-05 mem: 47% pow: 655.62 W 0: INFO 26-04-29 08:49:24.999350 - 7:31:53 - step: 18780 acc: 0 loss: 1.1952 grad: 1.43e-01 flops: 3.88e+14 wps: 4.51e+04 iter: 0.7225 data: 0.0727 lr: 4.65e-05 mem: 47% pow: 607.666 W 0: INFO 26-04-29 08:49:38.971063 - 7:32:07 - step: 18790 acc: 0 loss: 1.2258 grad: 1.46e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6185 data: 0.0719 lr: 4.64e-05 mem: 47% pow: 649.596 W 0: INFO 26-04-29 08:49:53.409337 - 7:32:21 - step: 18800 acc: 0 loss: 1.2796 grad: 1.52e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.7021 data: 0.0709 lr: 4.64e-05 mem: 47% pow: 600.166 W 0: INFO 26-04-29 08:50:10.459099 - 7:32:39 - step: 18810 acc: 0 loss: 1.4909 grad: 1.48e-01 flops: 3.31e+14 wps: 3.85e+04 iter: 0.6117 data: 0.0852 lr: 4.64e-05 mem: 54% pow: 644.789 W 0: INFO 26-04-29 08:50:24.845948 - 7:32:53 - step: 18820 acc: 0 loss: 1.3284 grad: 1.54e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6062 data: 0.0673 lr: 4.64e-05 mem: 47% pow: 654.263 W 0: INFO 26-04-29 08:50:38.919272 - 7:33:07 - step: 18830 acc: 0 loss: 1.326 grad: 1.53e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6738 data: 0.0252 lr: 4.64e-05 mem: 47% pow: 641.893 W 0: INFO 26-04-29 08:50:54.583104 - 7:33:23 - step: 18840 acc: 0 loss: 1.6733 grad: 1.54e-01 flops: 3.61e+14 wps: 4.19e+04 iter: 0.647 data: 0.0787 lr: 4.64e-05 mem: 47% pow: 632.007 W 0: INFO 26-04-29 08:51:08.468618 - 7:33:37 - step: 18850 acc: 0 loss: 1.359 grad: 1.53e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6539 data: 0.0553 lr: 4.64e-05 mem: 47% pow: 646.597 W 0: INFO 26-04-29 08:51:22.778999 - 7:33:51 - step: 18860 acc: 0 loss: 1.415 grad: 1.62e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6237 data: 0.1019 lr: 4.63e-05 mem: 47% pow: 641.731 W 0: INFO 26-04-29 08:51:36.622066 - 7:34:05 - step: 18870 acc: 0 loss: 1.2185 grad: 1.41e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6685 data: 0.0686 lr: 4.63e-05 mem: 47% pow: 631.007 W 0: INFO 26-04-29 08:51:50.495562 - 7:34:19 - step: 18880 acc: 0 loss: 1.0909 grad: 1.45e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.7603 data: 0.071 lr: 4.63e-05 mem: 47% pow: 573.998 W 0: INFO 26-04-29 08:52:04.241741 - 7:34:32 - step: 18890 acc: 0 loss: 1.3728 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6048 data: 0.0758 lr: 4.63e-05 mem: 47% pow: 650.052 W 0: INFO 26-04-29 08:52:18.392270 - 7:34:46 - step: 18900 acc: 0 loss: 1.4636 grad: 1.48e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6901 data: 0.0834 lr: 4.63e-05 mem: 47% pow: 598.903 W 0: INFO 26-04-29 08:52:35.033441 - 7:35:03 - step: 18910 acc: 0 loss: 1.3551 grad: 1.49e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6272 data: 0.0708 lr: 4.63e-05 mem: 54% pow: 641.588 W 0: INFO 26-04-29 08:52:48.903563 - 7:35:17 - step: 18920 acc: 0 loss: 1.6688 grad: 1.61e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6264 data: 0.0656 lr: 4.62e-05 mem: 47% pow: 649.284 W 0: INFO 26-04-29 08:53:03.151771 - 7:35:31 - step: 18930 acc: 0 loss: 1.6197 grad: 1.44e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.7493 data: 0.0026 lr: 4.62e-05 mem: 47% pow: 618.128 W 0: INFO 26-04-29 08:53:17.638360 - 7:35:46 - step: 18940 acc: 0 loss: 1.443 grad: 1.55e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 1.1512 data: 0.0656 lr: 4.62e-05 mem: 47% pow: 425.166 W 0: INFO 26-04-29 08:53:31.590828 - 7:36:00 - step: 18950 acc: 0 loss: 1.7167 grad: 1.71e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6266 data: 0.0673 lr: 4.62e-05 mem: 47% pow: 648.665 W 0: INFO 26-04-29 08:53:47.646723 - 7:36:16 - step: 18960 acc: 0 loss: 1.5023 grad: 1.64e-01 flops: 3.52e+14 wps: 4.08e+04 iter: 0.6339 data: 0.0736 lr: 4.62e-05 mem: 47% pow: 642.053 W 0: INFO 26-04-29 08:54:01.528562 - 7:36:30 - step: 18970 acc: 0 loss: 1.0979 grad: 1.59e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6424 data: 0.0728 lr: 4.62e-05 mem: 47% pow: 631.884 W 0: INFO 26-04-29 08:54:15.424825 - 7:36:44 - step: 18980 acc: 0 loss: 1.5849 grad: 1.51e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.5959 data: 0.0907 lr: 4.62e-05 mem: 47% pow: 655.446 W 0: INFO 26-04-29 08:54:29.581660 - 7:36:58 - step: 18990 acc: 0 loss: 1.548 grad: 1.55e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6709 data: 0.0375 lr: 4.61e-05 mem: 47% pow: 635.912 W 0: INFO 26-04-29 08:54:43.726971 - 7:37:12 - step: 19000 acc: 0 loss: 1.4425 grad: 1.65e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6309 data: 0.0677 lr: 4.61e-05 mem: 47% pow: 663.1 W 0: INFO 26-04-29 08:54:47.394598 - 7:37:15 - garbage collection 0: INFO 26-04-29 08:55:02.439260 - 7:37:31 - step: 19010 acc: 0 loss: 1.2666 grad: 1.63e-01 flops: 3.02e+14 wps: 3.50e+04 iter: 0.6387 data: 0.0674 lr: 4.61e-05 mem: 54% pow: 639.97 W 0: INFO 26-04-29 08:55:16.237464 - 7:37:44 - step: 19020 acc: 0 loss: 1.4221 grad: 1.60e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6075 data: 0.0706 lr: 4.61e-05 mem: 47% pow: 648.158 W 0: INFO 26-04-29 08:55:30.102833 - 7:37:58 - step: 19030 acc: 0 loss: 1.7569 grad: 1.75e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6396 data: 0.0506 lr: 4.61e-05 mem: 47% pow: 646.423 W 0: INFO 26-04-29 08:55:44.198714 - 7:38:12 - step: 19040 acc: 0 loss: 1.3603 grad: 1.58e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6496 data: 0.0942 lr: 4.61e-05 mem: 47% pow: 613.497 W 0: INFO 26-04-29 08:55:58.160489 - 7:38:26 - step: 19050 acc: 0 loss: 1.1003 grad: 1.75e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6316 data: 0.072 lr: 4.61e-05 mem: 47% pow: 639.844 W 0: INFO 26-04-29 08:56:12.203122 - 7:38:40 - step: 19060 acc: 0 loss: 1.5315 grad: 1.57e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6307 data: 0.0547 lr: 4.60e-05 mem: 47% pow: 654.52 W 0: INFO 26-04-29 08:56:26.356468 - 7:38:54 - step: 19070 acc: 0 loss: 1.423 grad: 1.48e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6431 data: 0.0721 lr: 4.60e-05 mem: 47% pow: 631.902 W 0: INFO 26-04-29 08:56:40.798604 - 7:39:09 - step: 19080 acc: 0 loss: 1.3057 grad: 1.52e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6778 data: 0.0472 lr: 4.60e-05 mem: 47% pow: 629.747 W 0: INFO 26-04-29 08:56:54.548648 - 7:39:23 - step: 19090 acc: 0 loss: 1.5696 grad: 2.04e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5998 data: 0.0725 lr: 4.60e-05 mem: 47% pow: 658.067 W 0: INFO 26-04-29 08:57:08.473637 - 7:39:37 - step: 19100 acc: 0 loss: 1.8698 grad: 1.58e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7148 data: 0.086 lr: 4.60e-05 mem: 47% pow: 582.845 W 0: INFO 26-04-29 08:57:25.535148 - 7:39:54 - step: 19110 acc: 0 loss: 1.7419 grad: 1.65e-01 flops: 3.31e+14 wps: 3.84e+04 iter: 0.6683 data: 0.0714 lr: 4.60e-05 mem: 54% pow: 619.495 W 0: INFO 26-04-29 08:57:39.496684 - 7:40:08 - step: 19120 acc: 0 loss: 1.4948 grad: 1.52e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6316 data: 0.0712 lr: 4.60e-05 mem: 47% pow: 639.834 W 0: INFO 26-04-29 08:57:53.439316 - 7:40:22 - step: 19130 acc: 0 loss: 1.1078 grad: 1.46e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6831 data: 0.0217 lr: 4.59e-05 mem: 47% pow: 642.764 W 0: INFO 26-04-29 08:58:08.186243 - 7:40:36 - step: 19140 acc: 0 loss: 1.1417 grad: 1.50e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.644 data: 0.0696 lr: 4.59e-05 mem: 47% pow: 631.482 W 0: INFO 26-04-29 08:58:28.366417 - 7:40:56 - step: 19150 acc: 0 loss: 1.2298 grad: 1.46e-01 flops: 2.80e+14 wps: 3.25e+04 iter: 0.6859 data: 0.0588 lr: 4.59e-05 mem: 47% pow: 619.012 W 0: INFO 26-04-29 08:58:43.135063 - 7:41:11 - step: 19160 acc: 0 loss: 1.494 grad: 1.46e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.6092 data: 0.0848 lr: 4.59e-05 mem: 47% pow: 662.592 W 0: INFO 26-04-29 08:58:57.031711 - 7:41:25 - step: 19170 acc: 0 loss: 1.1717 grad: 1.51e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.8451 data: 0.0647 lr: 4.59e-05 mem: 47% pow: 534.519 W 0: INFO 26-04-29 09:02:19.101052 - 7:44:47 - step: 19180 acc: 0 loss: 1.3165 grad: 1.55e-01 flops: 2.79e+13 wps: 3.24e+03 iter: 0.5961 data: 0.0757 lr: 4.59e-05 mem: 47% pow: 658.188 W 0: INFO 26-04-29 09:02:33.168994 - 7:45:01 - step: 19190 acc: 0 loss: 1.0831 grad: 1.46e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6551 data: 0.0617 lr: 4.58e-05 mem: 47% pow: 630.619 W 0: INFO 26-04-29 09:02:47.014471 - 7:45:15 - step: 19200 acc: 0 loss: 1.4445 grad: 1.48e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6961 data: 0.0057 lr: 4.58e-05 mem: 47% pow: 640.476 W 0: INFO 26-04-29 09:03:03.517534 - 7:45:32 - step: 19210 acc: 0 loss: 1.2911 grad: 1.61e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6267 data: 0.0743 lr: 4.58e-05 mem: 54% pow: 644.231 W 0: INFO 26-04-29 09:03:17.292835 - 7:45:45 - step: 19220 acc: 0 loss: 1.3194 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6356 data: 0.0652 lr: 4.58e-05 mem: 47% pow: 639.069 W 0: INFO 26-04-29 09:03:31.308337 - 7:45:59 - step: 19230 acc: 0 loss: 1.6376 grad: 1.43e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6584 data: 0.0773 lr: 4.58e-05 mem: 47% pow: 624.856 W 0: INFO 26-04-29 09:03:45.063291 - 7:46:13 - step: 19240 acc: 0 loss: 1.4066 grad: 1.44e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6199 data: 0.0716 lr: 4.58e-05 mem: 47% pow: 653.541 W 0: INFO 26-04-29 09:03:59.276215 - 7:46:27 - step: 19250 acc: 0 loss: 1.458 grad: 1.47e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.7261 data: 0.07 lr: 4.58e-05 mem: 47% pow: 587.196 W 0: INFO 26-04-29 09:04:13.558959 - 7:46:42 - step: 19260 acc: 0 loss: 1.3597 grad: 1.51e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6651 data: 0.039 lr: 4.57e-05 mem: 47% pow: 642.058 W 0: INFO 26-04-29 09:04:27.406804 - 7:46:55 - step: 19270 acc: 0 loss: 1.1943 grad: 1.53e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.611 data: 0.0723 lr: 4.57e-05 mem: 47% pow: 655.259 W 0: INFO 26-04-29 09:04:41.388142 - 7:47:09 - step: 19280 acc: 0 loss: 1.4661 grad: 1.57e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6176 data: 0.0762 lr: 4.57e-05 mem: 47% pow: 655.53 W 0: INFO 26-04-29 09:04:54.965435 - 7:47:23 - step: 19290 acc: 0 loss: 1.1502 grad: 1.53e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6138 data: 0.0752 lr: 4.57e-05 mem: 47% pow: 654.788 W 0: INFO 26-04-29 09:05:08.988110 - 7:47:37 - step: 19300 acc: 0 loss: 1.2746 grad: 1.45e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.8107 data: 0.0811 lr: 4.57e-05 mem: 47% pow: 536.089 W 0: INFO 26-04-29 09:05:25.865309 - 7:47:54 - step: 19310 acc: 0 loss: 1.3112 grad: 1.47e-01 flops: 3.35e+14 wps: 3.88e+04 iter: 0.6173 data: 0.076 lr: 4.57e-05 mem: 54% pow: 646.672 W 0: INFO 26-04-29 09:05:39.697510 - 7:48:08 - step: 19320 acc: 0 loss: 1.518 grad: 1.43e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6371 data: 0.0667 lr: 4.57e-05 mem: 47% pow: 646.185 W 0: INFO 26-04-29 09:05:53.826818 - 7:48:22 - step: 19330 acc: 0 loss: 1.542 grad: 1.49e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.8403 data: 0.0744 lr: 4.56e-05 mem: 47% pow: 522.569 W 0: INFO 26-04-29 09:06:07.603700 - 7:48:36 - step: 19340 acc: 0 loss: 1.2123 grad: 1.53e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6372 data: 0.0696 lr: 4.56e-05 mem: 47% pow: 636.528 W 0: INFO 26-04-29 09:06:21.822335 - 7:48:50 - step: 19350 acc: 0 loss: 0.8917 grad: 1.50e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6298 data: 0.0802 lr: 4.56e-05 mem: 47% pow: 642.239 W 0: INFO 26-04-29 09:06:35.603339 - 7:49:04 - step: 19360 acc: 0 loss: 1.5728 grad: 1.67e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.601 data: 0.0774 lr: 4.56e-05 mem: 47% pow: 654.971 W 0: INFO 26-04-29 09:06:49.304618 - 7:49:17 - step: 19370 acc: 0 loss: 1.4077 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6398 data: 0.0723 lr: 4.56e-05 mem: 47% pow: 636.155 W 0: INFO 26-04-29 09:07:03.096228 - 7:49:31 - step: 19380 acc: 0 loss: 1.0863 grad: 1.51e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.615 data: 0.0875 lr: 4.56e-05 mem: 47% pow: 639.478 W 0: INFO 26-04-29 09:07:16.702725 - 7:49:45 - step: 19390 acc: 0 loss: 1.4222 grad: 1.51e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6227 data: 0.0665 lr: 4.55e-05 mem: 47% pow: 653.256 W 0: INFO 26-04-29 09:07:30.744642 - 7:49:59 - step: 19400 acc: 0 loss: 1.5965 grad: 1.47e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.609 data: 0.0637 lr: 4.55e-05 mem: 47% pow: 660.921 W 0: INFO 26-04-29 09:07:47.770348 - 7:50:16 - step: 19410 acc: 0 loss: 0.9336 grad: 1.53e-01 flops: 3.32e+14 wps: 3.85e+04 iter: 0.6104 data: 0.0672 lr: 4.55e-05 mem: 54% pow: 653.161 W 0: INFO 26-04-29 09:08:01.452818 - 7:50:30 - step: 19420 acc: 0 loss: 1.0846 grad: 1.48e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.629 data: 0.0714 lr: 4.55e-05 mem: 47% pow: 633.622 W 0: INFO 26-04-29 09:08:15.008675 - 7:50:43 - step: 19430 acc: 0 loss: 1.5988 grad: 1.57e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6245 data: 0.0606 lr: 4.55e-05 mem: 47% pow: 653.073 W 0: INFO 26-04-29 09:08:28.967542 - 7:50:57 - step: 19440 acc: 0 loss: 1.5763 grad: 1.46e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6225 data: 0.069 lr: 4.55e-05 mem: 47% pow: 661.438 W 0: INFO 26-04-29 09:08:42.676242 - 7:51:11 - step: 19450 acc: 0 loss: 1.5985 grad: 1.83e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6407 data: 0.0703 lr: 4.55e-05 mem: 47% pow: 637.702 W 0: INFO 26-04-29 09:08:56.588131 - 7:51:25 - step: 19460 acc: 0 loss: 1.488 grad: 1.47e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6806 data: 0.073 lr: 4.54e-05 mem: 47% pow: 613.848 W 0: INFO 26-04-29 09:09:10.248855 - 7:51:38 - step: 19470 acc: 0 loss: 1.3294 grad: 1.52e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6089 data: 0.0862 lr: 4.54e-05 mem: 47% pow: 640.685 W 0: INFO 26-04-29 09:09:24.265711 - 7:51:52 - step: 19480 acc: 0 loss: 1.3878 grad: 1.53e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.8231 data: 0.0709 lr: 4.54e-05 mem: 47% pow: 537.946 W 0: INFO 26-04-29 09:09:37.825558 - 7:52:06 - step: 19490 acc: 0 loss: 1.3562 grad: 1.51e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6244 data: 0.0677 lr: 4.54e-05 mem: 47% pow: 649.906 W 0: INFO 26-04-29 09:09:51.551555 - 7:52:20 - step: 19500 acc: 0 loss: 1.5437 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6544 data: 0.0741 lr: 4.54e-05 mem: 47% pow: 624.589 W 0: INFO 26-04-29 09:10:08.437024 - 7:52:37 - step: 19510 acc: 0 loss: 1.5466 grad: 1.50e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6155 data: 0.069 lr: 4.54e-05 mem: 54% pow: 651.311 W 0: INFO 26-04-29 09:10:22.380725 - 7:52:50 - step: 19520 acc: 0 loss: 1.3228 grad: 1.72e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6775 data: 0.0694 lr: 4.54e-05 mem: 47% pow: 622.182 W 0: INFO 26-04-29 09:10:36.580561 - 7:53:05 - step: 19530 acc: 0 loss: 1.3967 grad: 1.56e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6133 data: 0.0741 lr: 4.53e-05 mem: 47% pow: 656.303 W 0: INFO 26-04-29 09:10:50.348717 - 7:53:18 - step: 19540 acc: 0 loss: 1.0523 grad: 1.59e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.6463 data: 0.0721 lr: 4.53e-05 mem: 47% pow: 625.83 W 0: INFO 26-04-29 09:11:04.465860 - 7:53:33 - step: 19550 acc: 0 loss: 1.54 grad: 3.23e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.7511 data: 0.0825 lr: 4.53e-05 mem: 47% pow: 565.393 W 0: INFO 26-04-29 09:11:18.508282 - 7:53:47 - step: 19560 acc: 0 loss: 1.401 grad: 1.54e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6481 data: 0.0808 lr: 4.53e-05 mem: 47% pow: 627.091 W 0: INFO 26-04-29 09:11:32.283598 - 7:54:00 - step: 19570 acc: 0 loss: 1.4058 grad: 1.58e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6932 data: 0.0731 lr: 4.53e-05 mem: 47% pow: 601.939 W 0: INFO 26-04-29 09:11:45.806723 - 7:54:14 - step: 19580 acc: 0 loss: 1.3643 grad: 1.52e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6133 data: 0.0801 lr: 4.53e-05 mem: 47% pow: 645.381 W 0: INFO 26-04-29 09:11:59.592219 - 7:54:28 - step: 19590 acc: 0 loss: 1.6421 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6386 data: 0.0734 lr: 4.53e-05 mem: 47% pow: 632.949 W 0: INFO 26-04-29 09:12:13.428673 - 7:54:42 - step: 19600 acc: 0 loss: 1.3107 grad: 1.49e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6002 data: 0.0902 lr: 4.52e-05 mem: 47% pow: 650.547 W 0: INFO 26-04-29 09:12:30.328774 - 7:54:58 - step: 19610 acc: 0 loss: 1.529 grad: 1.47e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6595 data: 0.0716 lr: 4.52e-05 mem: 54% pow: 620.911 W 0: WARNING 26-04-29 14:10:02.989359 - 0:00:00 - Signal handler installed. 0: WARNING 26-04-29 14:10:02.989794 - 0:00:00 - WARNING: Setting MKL_SERVICE_FORCE_INTEL to GNU 0: WARNING 26-04-29 14:10:02.989893 - 0:00:00 - WARNING: Setting MKL_NUM_THREADS to 1 0: WARNING 26-04-29 14:10:02.989961 - 0:00:00 - WARNING: Setting ENABLE_INTRA_NODE_COMM to 1 0: WARNING 26-04-29 14:10:02.990015 - 0:00:00 - WARNING: Setting TORCH_NCCL_AVOID_RECORD_STREAMS to 1 0: WARNING 26-04-29 14:10:02.990070 - 0:00:00 - WARNING: Setting NCCL_IB_TIMEOUT to 22 0: WARNING 26-04-29 14:10:02.990121 - 0:00:00 - WARNING: Setting NCCL_DEBUG to INFO 0: WARNING 26-04-29 14:10:02.990171 - 0:00:00 - WARNING: Setting TRITON_CACHE_DIR to /scratch/local/xun/tmp/tmpa6f1p8ti 0: INFO 26-04-29 14:10:13.249352 - 0:00:10 - Run launched with torchrun, local rank: 0 0: INFO 26-04-29 14:10:13.250154 - 0:00:10 - ENV: environ({'SHELL': '/bin/bash', '__EGL_VENDOR_LIBRARY_DIRS': '/home/xun/anaconda3/share/glvnd/egl_vendor.d', 'COLORTERM': 'truecolor', 'SLURM_STEP_NUM_TASKS': '4', 'PYENV_SHELL': 'bash', 'SLURM_JOB_USER': 'xun', 'SLURM_TASKS_PER_NODE': '1(x4)', 'PYTHONUNBUFFERED': '1', 'SLURM_JOB_UID': '1005', 'OLD_PATH': '/usr/local/cuda/bin:/opt/slurm/bin:/home/xun/.local/bin:/opt/pyenv/shims:/opt/pyenv/bin:/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/bin/remote-cli:/home/xun/.local/bin:/home/xun/bin:/home/xun/.nvm/versions/node/v22.22.2/bin:/home/xun/anaconda3/bin:/home/xun/anaconda3/condabin:/home/xun/.local/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/opt/pyenv/bin:/home/xun/.local/bin:/home/xun/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin', 'SLURM_STEP_GPUS': '0,1,2,3,4,5,6,7', 'NVM_INC': '/home/xun/.nvm/versions/node/v22.22.2/include/node', 'TERM_PROGRAM_VERSION': '3.1.15', 'SLURM_CPU_BIND': 'quiet,mask_cpu:0x000000FFFFFFFFFFFFFFFF000000FFFFFFFFFFFFFFFF', 'HPCX_HCOLL_DIR': '/opt/hpcx/hcoll', 'SLURM_TASK_PID': '1153992', 'CONDA_EXE': '/home/xun/anaconda3/bin/conda', '_CE_M': '', 'PKG_CONFIG_PATH': '/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:', 'SLURM_JOB_GPUS': '0,1,2,3,4,5,6,7', 'SLURM_LOCALID': '0', 'PYTHONNOUSERSITE': '1', 'SLURM_SUBMIT_DIR': '/home/xun/rsadhukh/STEM', 'SLURM_CPU_BIND_VERBOSE': 'quiet', 'HOSTNAME': 'compute-node-14', 'HPCX_CLUSTERKIT_DIR': '/opt/hpcx/clusterkit', 'SLURMD_NODENAME': 'compute-node-14', 'MASTER_PORT': '29500', 'SLURM_JOB_START_TIME': '1777471771', 'TORCH_NCCL_TIMEOUT': '1200', 'HYDRA_LAUNCHER_EXTRA_ARGS': '--external-launcher', 'OMPI_HOME': '/opt/hpcx/ompi', 'HPCX_OSU_CUDA_DIR': '/opt/hpcx/ompi/tests/osu-micro-benchmarks-cuda', 'SLURM_STEP_NODELIST': 'compute-node-[14,0,43-44]', 'TRAINING_LOG_DIR': '/home/xun/rsadhukh/STEM/logs/midfine_base_final', 'WANDB_DIR': '/home/xun/rsadhukh/STEM/logs/midfine_base_final', 'SLURM_CLUSTER_NAME': 'cluster', 'SLURM_JOB_END_TIME': '1777644571', 'SLURM_CPUS_ON_NODE': '128', 'SLURM_UMASK': '0000', 'HPCX_OSU_DIR': '/opt/hpcx/ompi/tests/osu-micro-benchmarks', 'SLURM_JOB_CPUS_PER_NODE': '128(x4)', 'HPCX_MPI_DIR': '/opt/hpcx/ompi', 'HPCX_OSHMEM_DIR': '/opt/hpcx/ompi', 'SLURM_GPUS_ON_NODE': '8', 'PWD': '/home/xun/rsadhukh/STEM', 'HPCX_UCC_DIR': '/opt/hpcx/ucc', 'PRTE_MCA_plm_slurm_args': '--external-launcher', 'SLURM_GTIDS': '0', 'GSETTINGS_SCHEMA_DIR': '/home/xun/anaconda3/share/glib-2.0/schemas', 'LOGNAME': 'xun', 'XDG_SESSION_TYPE': 'tty', 'CONDA_PREFIX': '/home/xun/anaconda3', 'SLURM_JOB_PARTITION': 'high', 'MODULESHOME': '/usr/share/modules', 'MANPATH': '/home/xun/.nvm/versions/node/v22.22.2/share/man::', 'SLURM_TRES_PER_TASK': 'cpu:128', 'GSETTINGS_SCHEMA_DIR_CONDA_BACKUP': '', 'SLURM_JOB_NUM_NODES': '4', 'SRUN_DEBUG': '3', 'SLURM_STEPID': '0', 'SLURM_CPU_BIND_LIST': '0x000000FFFFFFFFFFFFFFFF000000FFFFFFFFFFFFFFFF', 'VSCODE_GIT_ASKPASS_NODE': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/node', 'SLURM_JOBID': '29527', 'GLOO_SOCKET_IFNAME': 'ens7', 'WORLD_SIZE': '32', 'SLURM_LAUNCH_NODE_IPADDR': '172.27.49.7', 'I_MPI_HYDRA_BOOTSTRAP_EXEC_EXTRA_ARGS': '--external-launcher', 'OLD_PKG_CONFIG_PATH': '/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:', 'MPI_HOME': '/opt/hpcx/ompi', 'MOTD_SHOWN': 'pam', 'TORCH_LOGS': 'recompiles,graph_breaks,dynamo,inductor', 'HOME': '/home/xun', 'LANG': 'C.UTF-8', 'SLURM_CPU_BIND_TYPE': 'mask_cpu:', 'LS_COLORS': 'rs=0:di=01;34:ln=01;36:mh=00:pi=40;33:so=01;35:do=01;35:bd=40;33;01:cd=40;33;01:or=40;31;01:mi=00:su=37;41:sg=30;43:ca=30;41:tw=30;42:ow=34;42:st=37;44:ex=01;32:*.tar=01;31:*.tgz=01;31:*.arc=01;31:*.arj=01;31:*.taz=01;31:*.lha=01;31:*.lz4=01;31:*.lzh=01;31:*.lzma=01;31:*.tlz=01;31:*.txz=01;31:*.tzo=01;31:*.t7z=01;31:*.zip=01;31:*.z=01;31:*.dz=01;31:*.gz=01;31:*.lrz=01;31:*.lz=01;31:*.lzo=01;31:*.xz=01;31:*.zst=01;31:*.tzst=01;31:*.bz2=01;31:*.bz=01;31:*.tbz=01;31:*.tbz2=01;31:*.tz=01;31:*.deb=01;31:*.rpm=01;31:*.jar=01;31:*.war=01;31:*.ear=01;31:*.sar=01;31:*.rar=01;31:*.alz=01;31:*.ace=01;31:*.zoo=01;31:*.cpio=01;31:*.7z=01;31:*.rz=01;31:*.cab=01;31:*.wim=01;31:*.swm=01;31:*.dwm=01;31:*.esd=01;31:*.jpg=01;35:*.jpeg=01;35:*.mjpg=01;35:*.mjpeg=01;35:*.gif=01;35:*.bmp=01;35:*.pbm=01;35:*.pgm=01;35:*.ppm=01;35:*.tga=01;35:*.xbm=01;35:*.xpm=01;35:*.tif=01;35:*.tiff=01;35:*.png=01;35:*.svg=01;35:*.svgz=01;35:*.mng=01;35:*.pcx=01;35:*.mov=01;35:*.mpg=01;35:*.mpeg=01;35:*.m2v=01;35:*.mkv=01;35:*.webm=01;35:*.webp=01;35:*.ogm=01;35:*.mp4=01;35:*.m4v=01;35:*.mp4v=01;35:*.vob=01;35:*.qt=01;35:*.nuv=01;35:*.wmv=01;35:*.asf=01;35:*.rm=01;35:*.rmvb=01;35:*.flc=01;35:*.avi=01;35:*.fli=01;35:*.flv=01;35:*.gl=01;35:*.dl=01;35:*.xcf=01;35:*.xwd=01;35:*.yuv=01;35:*.cgm=01;35:*.emf=01;35:*.ogv=01;35:*.ogx=01;35:*.aac=00;36:*.au=00;36:*.flac=00;36:*.m4a=00;36:*.mid=00;36:*.midi=00;36:*.mka=00;36:*.mp3=00;36:*.mpc=00;36:*.ogg=00;36:*.ra=00;36:*.wav=00;36:*.oga=00;36:*.opus=00;36:*.spx=00;36:*.xspf=00;36:', 'OSHMEM_HOME': '/opt/hpcx/ompi', 'SLURMD_DEBUG': '2', 'SLURM_PROCID': '0', 'OLD_LIBRARY_PATH': '/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:', 'VIRTUAL_ENV': '/home/xun/rsadhukh/STEM/stem', 'SSL_CERT_DIR': '/usr/lib/ssl/certs', 'HPCX_UCX_DIR': '/opt/hpcx/ucx', 'CONDA_PROMPT_MODIFIER': '(base) ', 'TMPDIR': '/scratch/local/xun/tmp', 'GIT_ASKPASS': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/extensions/git/dist/askpass.sh', 'VSCODE_GIT_IPC_AUTH_TOKEN': 'e9c91a1bab37ff9482f8c1a25d24a2b678ee98e75266f48ee778bb93a29d0880', 'SLURM_CPUS_PER_TASK': '128', 'SLURM_NTASKS': '4', 'CONFIG_PATH': 'apps/main/configs/olmo2_1B_midfine.yaml', 'SLURM_TOPOLOGY_ADDR': 'compute-node-14', 'SSH_CONNECTION': '67.163.187.8 64380 172.27.51.97 22', 'OLD_CPATH': '/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:', 'SLURM_DISTRIBUTION': 'cyclic', 'ROOT_MODEL_DIR': '/data/rsadhukh/checkpoints', 'PYTORCH_CUDA_ALLOC_CONF': 'expandable_segments:True', 'HYDRA_BOOTSTRAP': 'slurm', 'SHMEM_HOME': '/opt/hpcx/ompi', 'NVM_DIR': '/home/xun/.nvm', 'MASTER_ADDR': 'compute-node-14', 'VSCODE_GIT_ASKPASS_EXTRA_ARGS': '', 'CUDA_VISIBLE_DEVICES': '0,1,2,3,4,5,6,7', 'SLURM_TOPOLOGY_ADDR_PATTERN': 'node', 'SLURM_SRUN_COMM_HOST': '172.27.49.7', '_CONDA_EXE': '/home/xun/anaconda3/bin/conda', 'LESSCLOSE': '/usr/bin/lesspipe %s %s', '_CONDA_ROOT': '/home/xun/anaconda3', 'XDG_SESSION_CLASS': 'user', 'PYTHONPATH': '/home/xun/rsadhukh/STEM:', 'TERM': 'xterm-256color', '_CE_CONDA': '', 'LESSOPEN': '| /usr/bin/lesspipe %s', 'USER': 'xun', 'LIBRARY_PATH': '/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:', 'HPCX_SHARP_DIR': '/opt/hpcx/sharp', 'SLURM_NODELIST': 'compute-node-[14,0,43-44]', 'WANDB_API_KEY': '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', 'VSCODE_GIT_IPC_HANDLE': '/run/user/1005/vscode-git-21eb2adf6a.sock', 'ENVIRONMENT': 'BATCH', 'CONDA_SHLVL': '1', 'SLURM_SRUN_COMM_PORT': '46439', 'NODES': '4', 'EXP_NAME': 'midfine_base_final', 'LOADEDMODULES': '', 'TEMP': '/scratch/local/xun/tmp', 'SLURM_STEP_ID': '0', 'SLURM_PRIO_PROCESS': '0', 'SLURM_NPROCS': '4', 'SHLVL': '3', 'NVM_CD_FLAGS': '', 'SLURM_NNODES': '4', 'WANDB_MODE': 'online', 'HPCX_DIR': '/opt/hpcx', 'XDG_SESSION_ID': '1916', 'VIRTUAL_ENV_PROMPT': '(stem) ', 'TORCHINDUCTOR_COMPILE_THREADS': '32', 'SLURM_SUBMIT_HOST': 'login-node-0', 'CONDA_PYTHON_EXE': '/home/xun/anaconda3/bin/python', 'LD_LIBRARY_PATH': '/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:', 'NCCL_IB_DISABLE': '0', 'XDG_RUNTIME_DIR': '/run/user/1005', 'SLURM_JOB_ID': '29527', 'SSL_CERT_FILE': '/usr/lib/ssl/certs/ca-certificates.crt', 'SLURM_NODEID': '0', 'PS1': '(stem) ', 'SLURM_STEP_NUM_NODES': '4', 'SSH_CLIENT': '67.163.187.8 64380 22', 'CONDA_DEFAULT_ENV': 'base', 'PYENV_ROOT': '/opt/pyenv', 'OPAL_PREFIX': '/opt/hpcx/ompi', 'OMP_NUM_THREADS': '1', 'OLD_LD_LIBRARY_PATH': '/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:', 'SLURM_STEP_TASKS_PER_NODE': '1(x4)', 'WORLD_MODEL_LOG_LEVEL': 'DEBUG', 'VSCODE_GIT_ASKPASS_MAIN': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/extensions/git/dist/askpass-main.js', 'CUDA_HOME': '/usr/local/cuda-12.8', 'DATA_ROOT_DIR': '/home/xun/rsadhukh/STEM/data', 'XDG_DATA_DIRS': '/usr/local/share:/usr/share:/var/lib/snapd/desktop', 'NPROC_PER_NODE': '8', 'TORCH_FR_BUFFER_SIZE': '32', 'TMP': '/scratch/local/xun/tmp', 'BROWSER': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/bin/helpers/browser.sh', 'SLURM_CONF': '/var/spool/slurmd/conf-cache/slurm.conf', 'PATH': '/home/xun/rsadhukh/STEM/stem/bin:/home/xun/.local/bin:/home/xun/bin:/opt/pyenv/shims:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/home/xun/.local/bin:/opt/pyenv/bin:/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/bin/remote-cli:/home/xun/.local/bin:/home/xun/bin:/home/xun/.nvm/versions/node/v22.22.2/bin:/home/xun/anaconda3/bin:/home/xun/anaconda3/condabin:/home/xun/.local/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/opt/pyenv/bin:/home/xun/.local/bin:/home/xun/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin', 'HPCX_NCCL_RDMA_SHARP_PLUGIN_DIR': '/opt/hpcx/nccl_rdma_sharp_plugin', 'SLURM_JOB_NAME': 'stem', 'MODULEPATH': '/etc/environment-modules/modules:/usr/share/modules/versions:/usr/share/modules/$MODULE_VERSION/modulefiles:/usr/share/modules/modulefiles', 'SLURM_NTASKS_PER_NODE': '1', 'HPCX_MPI_TESTS_DIR': '/opt/hpcx/ompi/tests', 'DBUS_SESSION_BUS_ADDRESS': 'unix:path=/run/user/1005/bus', 'OLD_OPAL_PREFIX': '/opt/hpcx/ompi', 'NVM_BIN': '/home/xun/.nvm/versions/node/v22.22.2/bin', 'SLURM_STEP_LAUNCHER_PORT': '46439', 'OMPI_MCA_plm_slurm_args': '--external-launcher', 'SLURM_JOB_GID': '1005', 'CPATH': '/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:', 'HF_ALLOW_CODE_EVAL': '1', 'OVSX_REGISTRY_URL': 'https://open-vsx.org', 'OLDPWD': '/home/xun/rsadhukh/STEM', 'SLURM_JOB_NODELIST': 'compute-node-[14,0,43-44]', 'MODULES_CMD': '/usr/lib/x86_64-linux-gnu/modulecmd.tcl', 'TERM_PROGRAM': 'vscode', 'SLURM_OUTPUT_MODE': 'standard', 'VSCODE_IPC_HOOK_CLI': '/run/user/1005/vscode-ipc-6e7881a1-db52-4a0c-a6a0-9765d1799424.sock', 'I_MPI_HYDRA_BOOTSTRAP': 'slurm', 'BASH_FUNC_ml%%': '() { module ml "$@"\n}', 'BASH_FUNC_module%%': '() { eval `/usr/bin/tclsh8.6 /usr/lib/x86_64-linux-gnu/modulecmd.tcl bash "$@"`;\n _mlstatus=$?;\n return $_mlstatus\n}', '_': '/usr/bin/stdbuf', '_STDBUF_O': 'L', '_STDBUF_E': 'L', 'LD_PRELOAD': '/usr/libexec/coreutils/libstdbuf.so', 'LOCAL_RANK': '0', 'RANK': '0', 'GROUP_RANK': '0', 'ROLE_RANK': '0', 'ROLE_NAME': 'default', 'LOCAL_WORLD_SIZE': '8', 'GROUP_WORLD_SIZE': '4', 'ROLE_WORLD_SIZE': '32', 'TORCHELASTIC_RESTART_COUNT': '0', 'TORCHELASTIC_MAX_RESTARTS': '0', 'TORCHELASTIC_RUN_ID': 'none', 'TORCHELASTIC_USE_AGENT_STORE': 'True', 'TORCH_NCCL_ASYNC_ERROR_HANDLING': '1', 'TORCHELASTIC_ERROR_FILE': '/scratch/local/xun/tmp/torchelastic_kojn6cmb/none_mcpp2qd6/attempt_0/0/error.json', 'CUDA_MODULE_LOADING': 'LAZY', 'TORCHINDUCTOR_CACHE_DIR': '/scratch/local/xun/tmp/torchinductor_xun', 'KMP_DUPLICATE_LIB_OK': 'True', 'KMP_INIT_AT_FORK': 'FALSE', 'MKL_SERVICE_FORCE_INTEL': 'GNU', 'MKL_NUM_THREADS': '1', 'ENABLE_INTRA_NODE_COMM': '1', 'TORCH_NCCL_AVOID_RECORD_STREAMS': '1', 'NCCL_IB_TIMEOUT': '22', 'NCCL_DEBUG': 'INFO', 'TRITON_CACHE_DIR': '/scratch/local/xun/tmp/tmpa6f1p8ti'}) 0: INFO 26-04-29 14:10:21.125828 - 0:00:18 - Starting job: olmo2_1B_midfine 0: INFO 26-04-29 14:10:21.126080 - 0:00:18 - Running on dp rank : 0 0: INFO 26-04-29 14:10:21.126119 - 0:00:18 - Running on dp size : 32 0: INFO 26-04-29 14:10:21.126156 - 0:00:18 - Using model type: olmo3 (OLMo3LMTransformer) 0: INFO 26-04-29 14:10:21.128822 - 0:00:18 - Building model 0: INFO 26-04-29 14:10:21.144741 - 0:00:18 - Model is built ! 0: WARNING 26-04-29 14:10:21.339962 - 0:00:18 - Model parameter layers.0.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.340706 - 0:00:18 - Model parameter layers.0.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.341283 - 0:00:18 - Model parameter layers.0.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.341799 - 0:00:18 - Model parameter layers.0.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.342248 - 0:00:18 - Model parameter layers.0.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.342714 - 0:00:18 - Model parameter layers.0.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.343238 - 0:00:18 - Model parameter layers.0.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.343755 - 0:00:18 - Model parameter layers.0.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.344187 - 0:00:18 - Model parameter layers.0.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.344451 - 0:00:18 - Model parameter layers.0.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.344714 - 0:00:18 - Model parameter layers.0.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.345045 - 0:00:18 - Model parameter layers.1.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.345424 - 0:00:18 - Model parameter layers.1.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.345731 - 0:00:18 - Model parameter layers.1.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.346013 - 0:00:18 - Model parameter layers.1.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.346246 - 0:00:18 - Model parameter layers.1.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.346471 - 0:00:18 - Model parameter layers.1.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.346800 - 0:00:18 - Model parameter layers.1.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.347208 - 0:00:18 - Model parameter layers.1.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.347517 - 0:00:18 - Model parameter layers.1.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.347768 - 0:00:18 - Model parameter layers.1.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.347996 - 0:00:18 - Model parameter layers.1.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.348260 - 0:00:18 - Model parameter layers.2.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.348524 - 0:00:18 - Model parameter layers.2.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.348789 - 0:00:18 - Model parameter layers.2.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.349052 - 0:00:18 - Model parameter layers.2.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.349274 - 0:00:18 - Model parameter layers.2.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.349496 - 0:00:18 - Model parameter layers.2.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.349765 - 0:00:18 - Model parameter layers.2.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.350034 - 0:00:18 - Model parameter layers.2.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.350286 - 0:00:18 - Model parameter layers.2.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.350516 - 0:00:18 - Model parameter layers.2.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.350760 - 0:00:18 - Model parameter layers.2.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.351037 - 0:00:18 - Model parameter layers.3.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.351306 - 0:00:18 - Model parameter layers.3.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.351573 - 0:00:18 - Model parameter layers.3.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.351850 - 0:00:18 - Model parameter layers.3.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.352072 - 0:00:18 - Model parameter layers.3.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.352302 - 0:00:18 - Model parameter layers.3.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.352568 - 0:00:18 - Model parameter layers.3.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.352838 - 0:00:18 - Model parameter layers.3.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.353092 - 0:00:18 - Model parameter layers.3.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.353311 - 0:00:18 - Model parameter layers.3.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.353536 - 0:00:18 - Model parameter layers.3.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.353810 - 0:00:18 - Model parameter layers.4.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.354070 - 0:00:18 - Model parameter layers.4.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.354328 - 0:00:18 - Model parameter layers.4.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.354597 - 0:00:18 - Model parameter layers.4.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.354846 - 0:00:18 - Model parameter layers.4.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.355075 - 0:00:18 - Model parameter layers.4.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.355335 - 0:00:18 - Model parameter layers.4.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.355599 - 0:00:18 - Model parameter layers.4.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.355870 - 0:00:18 - Model parameter layers.4.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.356091 - 0:00:18 - Model parameter layers.4.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.356305 - 0:00:18 - Model parameter layers.4.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.356571 - 0:00:18 - Model parameter layers.5.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.356843 - 0:00:18 - Model parameter layers.5.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.357112 - 0:00:18 - Model parameter layers.5.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.357374 - 0:00:18 - Model parameter layers.5.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.357603 - 0:00:18 - Model parameter layers.5.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.357831 - 0:00:18 - Model parameter layers.5.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.358094 - 0:00:18 - Model parameter layers.5.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.358359 - 0:00:18 - Model parameter layers.5.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.358627 - 0:00:18 - Model parameter layers.5.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.358888 - 0:00:18 - Model parameter layers.5.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.359117 - 0:00:18 - Model parameter layers.5.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.359382 - 0:00:18 - Model parameter layers.6.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.359646 - 0:00:18 - Model parameter layers.6.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.359916 - 0:00:18 - Model parameter layers.6.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.360174 - 0:00:18 - Model parameter layers.6.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.360391 - 0:00:18 - Model parameter layers.6.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.360636 - 0:00:18 - Model parameter layers.6.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.360912 - 0:00:18 - Model parameter layers.6.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.361177 - 0:00:18 - Model parameter layers.6.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.361443 - 0:00:18 - Model parameter layers.6.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.361683 - 0:00:18 - Model parameter layers.6.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.361909 - 0:00:18 - Model parameter layers.6.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.362184 - 0:00:18 - Model parameter layers.7.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.362446 - 0:00:18 - Model parameter layers.7.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.362720 - 0:00:18 - Model parameter layers.7.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.363008 - 0:00:18 - Model parameter layers.7.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.363232 - 0:00:18 - Model parameter layers.7.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.363460 - 0:00:18 - Model parameter layers.7.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.363740 - 0:00:18 - Model parameter layers.7.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.364010 - 0:00:18 - Model parameter layers.7.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.364275 - 0:00:18 - Model parameter layers.7.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.364503 - 0:00:18 - Model parameter layers.7.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.364734 - 0:00:18 - Model parameter layers.7.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.365002 - 0:00:18 - Model parameter layers.8.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.365254 - 0:00:18 - Model parameter layers.8.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.365520 - 0:00:18 - Model parameter layers.8.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.365791 - 0:00:18 - Model parameter layers.8.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.366009 - 0:00:18 - Model parameter layers.8.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.366223 - 0:00:18 - Model parameter layers.8.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.366483 - 0:00:18 - Model parameter layers.8.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.366761 - 0:00:18 - Model parameter layers.8.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.367032 - 0:00:18 - Model parameter layers.8.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.367275 - 0:00:18 - Model parameter layers.8.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.367504 - 0:00:18 - Model parameter layers.8.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.367776 - 0:00:18 - Model parameter layers.9.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.368034 - 0:00:18 - Model parameter layers.9.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.368288 - 0:00:18 - Model parameter layers.9.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.368567 - 0:00:18 - Model parameter layers.9.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.368800 - 0:00:18 - Model parameter layers.9.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.369019 - 0:00:18 - Model parameter layers.9.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.369290 - 0:00:18 - Model parameter layers.9.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.369566 - 0:00:18 - Model parameter layers.9.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.369837 - 0:00:18 - Model parameter layers.9.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.370063 - 0:00:18 - Model parameter layers.9.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.370281 - 0:00:18 - Model parameter layers.9.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.370546 - 0:00:18 - Model parameter layers.10.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.371031 - 0:00:18 - Model parameter layers.10.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.371479 - 0:00:18 - Model parameter layers.10.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.371887 - 0:00:18 - Model parameter layers.10.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.372159 - 0:00:18 - Model parameter layers.10.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.372396 - 0:00:18 - Model parameter layers.10.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.372667 - 0:00:18 - Model parameter layers.10.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.372931 - 0:00:18 - Model parameter layers.10.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.373201 - 0:00:18 - Model parameter layers.10.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.373423 - 0:00:18 - Model parameter layers.10.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.373661 - 0:00:18 - Model parameter layers.10.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.373932 - 0:00:18 - Model parameter layers.11.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.374197 - 0:00:18 - Model parameter layers.11.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.374463 - 0:00:18 - Model parameter layers.11.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.374759 - 0:00:18 - Model parameter layers.11.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.375029 - 0:00:18 - Model parameter layers.11.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.375257 - 0:00:18 - Model parameter layers.11.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.375535 - 0:00:18 - Model parameter layers.11.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.375806 - 0:00:18 - Model parameter layers.11.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.376081 - 0:00:18 - Model parameter layers.11.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.376302 - 0:00:18 - Model parameter layers.11.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.376532 - 0:00:18 - Model parameter layers.11.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.376805 - 0:00:18 - Model parameter layers.12.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.377072 - 0:00:18 - Model parameter layers.12.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.377333 - 0:00:18 - Model parameter layers.12.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.377605 - 0:00:18 - Model parameter layers.12.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.377833 - 0:00:18 - Model parameter layers.12.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.378051 - 0:00:18 - Model parameter layers.12.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.378318 - 0:00:18 - Model parameter layers.12.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.378592 - 0:00:18 - Model parameter layers.12.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.378882 - 0:00:18 - Model parameter layers.12.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.379120 - 0:00:18 - Model parameter layers.12.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.379354 - 0:00:18 - Model parameter layers.12.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.379630 - 0:00:18 - Model parameter layers.13.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.379900 - 0:00:18 - Model parameter layers.13.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.380159 - 0:00:18 - Model parameter layers.13.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.380421 - 0:00:18 - Model parameter layers.13.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.380657 - 0:00:18 - Model parameter layers.13.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.380882 - 0:00:18 - Model parameter layers.13.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.381152 - 0:00:18 - Model parameter layers.13.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.381417 - 0:00:18 - Model parameter layers.13.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.381679 - 0:00:18 - Model parameter layers.13.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.381908 - 0:00:18 - Model parameter layers.13.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.382128 - 0:00:18 - Model parameter layers.13.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.382389 - 0:00:18 - Model parameter layers.14.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.382658 - 0:00:18 - Model parameter layers.14.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.382947 - 0:00:18 - Model parameter layers.14.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.383224 - 0:00:18 - Model parameter layers.14.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.383448 - 0:00:18 - Model parameter layers.14.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.383686 - 0:00:18 - Model parameter layers.14.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.383948 - 0:00:18 - Model parameter layers.14.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.384209 - 0:00:18 - Model parameter layers.14.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.384469 - 0:00:18 - Model parameter layers.14.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.384711 - 0:00:18 - Model parameter layers.14.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.384933 - 0:00:18 - Model parameter layers.14.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.385197 - 0:00:18 - Model parameter layers.15.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.385460 - 0:00:18 - Model parameter layers.15.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.385741 - 0:00:18 - Model parameter layers.15.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.386009 - 0:00:18 - Model parameter layers.15.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.386231 - 0:00:18 - Model parameter layers.15.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.386446 - 0:00:18 - Model parameter layers.15.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.386716 - 0:00:18 - Model parameter layers.15.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.387062 - 0:00:18 - Model parameter layers.15.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.387335 - 0:00:18 - Model parameter layers.15.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.387582 - 0:00:18 - Model parameter layers.15.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.387814 - 0:00:18 - Model parameter layers.15.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.388322 - 0:00:18 - Model parameter tok_embeddings.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.388601 - 0:00:18 - Model parameter norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.388912 - 0:00:18 - Model parameter output.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 14:10:21.389211 - 0:00:18 - Model parameter rope_embeddings.freqs_cis is all zeros: it might be because of a missing initialization 0: INFO 26-04-29 14:10:21.389505 - 0:00:18 - Model size: 1,484,916,736 total parameters 0: INFO 26-04-29 14:10:21.389825 - 0:00:18 - GPU capacity: NVIDIA H200 (0) with 139.80GiB memory 0: INFO 26-04-29 14:10:21.394242 - 0:00:18 - GPU memory usage: NVIDIA H200 (0): 139.80084228515625 GiB capacity, 0.208984375 GiB peak, 0.14948720736154641% peak 0: INFO 26-04-29 14:10:21.394347 - 0:00:18 - Starting build of optimizer... 0: INFO 26-04-29 14:10:21.395012 - 0:00:18 - Done with build of optimizer. 0: INFO 26-04-29 14:10:21.395080 - 0:00:18 - Using global DP dataloader sharding: rank 0/32 0: INFO 26-04-29 14:10:22.529371 - 0:00:20 - Loading initial model & optimizer from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/ 0: INFO 26-04-29 14:10:37.255762 - 0:00:34 - Reloading train state 0: INFO 26-04-29 14:10:37.267544 - 0:00:34 - Train state reloaded 0: INFO 26-04-29 14:10:37.267641 - 0:00:34 - Loading from: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000015000 0: INFO 26-04-29 14:10:39.642141 - 0:00:37 - Model and optim reloaded 0: DEBUG 26-04-29 14:10:39.649667 - 0:00:37 - Using selector: EpollSelector 0: DEBUG 26-04-29 14:10:39.732259 - 0:00:37 - Popen(['git', 'version'], cwd=/home/xun/rsadhukh/STEM, stdin=None, shell=False, universal_newlines=False) 0: DEBUG 26-04-29 14:10:39.748432 - 0:00:37 - Popen(['git', 'version'], cwd=/home/xun/rsadhukh/STEM, stdin=None, shell=False, universal_newlines=False) 0: DEBUG 26-04-29 14:10:39.753328 - 0:00:37 - sys.platform='linux', git_executable='git' 0: DEBUG 26-04-29 14:10:39.756215 - 0:00:37 - Popen(['git', 'rev-parse', '--show-toplevel'], cwd=/home/xun/rsadhukh/STEM, stdin=None, shell=False, universal_newlines=False) 0: DEBUG 26-04-29 14:10:39.767082 - 0:00:37 - Starting new HTTPS connection (1): api.wandb.ai:443 0: DEBUG 26-04-29 14:10:40.706009 - 0:00:38 - https://api.wandb.ai:443 "POST /graphql HTTP/1.1" 200 None 0: DEBUG 26-04-29 14:10:41.004075 - 0:00:38 - sys.platform='linux', git_executable='git' 0: DEBUG 26-04-29 14:10:41.007132 - 0:00:38 - Popen(['git', 'cat-file', '--batch-check'], cwd=/home/xun/rsadhukh/STEM, stdin=, shell=False, universal_newlines=False) 0: INFO 26-04-29 14:10:43.068959 - 0:00:40 - Loading data loader... 0: WARNING 26-04-29 14:10:43.069625 - 0:00:40 - track_packed_source_mixture=True: source counts are updated in the dataloader process only; forcing synchronous dataloader (load_async=False) for this run. 0: INFO 26-04-29 14:10:43.069917 - 0:00:40 - Loaded data loader! 0: INFO 26-04-29 14:10:43.070025 - 0:00:40 - Profiling active. Traces will be saved at /home/xun/rsadhukh/STEM/logs/midfine_base_final/profiling 0: INFO 26-04-29 14:10:43.070517 - 0:00:40 - Created trace directory! 0: INFO 26-04-29 14:10:43.070637 - 0:00:40 - Waiting at profiler barrier... 0: INFO 26-04-29 14:10:43.071424 - 0:00:40 - Profiler barrier passed 0: INFO 26-04-29 14:10:44.132354 - 0:00:41 - Using vocab_size=100352 from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/config.json (tokenizer has 100278 tokens) 0: INFO 26-04-29 14:10:44.133686 - 0:00:41 - HuggingFace tokenizer loaded from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/ – #words: 100352, BOS ID: 100257, EOS ID: 100257 0: WARNING 26-04-29 15:35:19.703293 - 0:00:00 - Signal handler installed. 0: WARNING 26-04-29 15:35:19.703665 - 0:00:00 - WARNING: Setting MKL_SERVICE_FORCE_INTEL to GNU 0: WARNING 26-04-29 15:35:19.703766 - 0:00:00 - WARNING: Setting MKL_NUM_THREADS to 1 0: WARNING 26-04-29 15:35:19.703844 - 0:00:00 - WARNING: Setting ENABLE_INTRA_NODE_COMM to 1 0: WARNING 26-04-29 15:35:19.703905 - 0:00:00 - WARNING: Setting TORCH_NCCL_AVOID_RECORD_STREAMS to 1 0: WARNING 26-04-29 15:35:19.703967 - 0:00:00 - WARNING: Setting NCCL_IB_TIMEOUT to 22 0: WARNING 26-04-29 15:35:19.704026 - 0:00:00 - WARNING: Setting NCCL_DEBUG to INFO 0: WARNING 26-04-29 15:35:19.704087 - 0:00:00 - WARNING: Setting TRITON_CACHE_DIR to /scratch/local/xun/tmp/tmpfxgobe_y 0: INFO 26-04-29 15:35:30.599434 - 0:00:11 - Run launched with torchrun, local rank: 0 0: INFO 26-04-29 15:35:30.600233 - 0:00:11 - ENV: environ({'SHELL': '/bin/bash', '__EGL_VENDOR_LIBRARY_DIRS': '/home/xun/anaconda3/share/glvnd/egl_vendor.d', 'COLORTERM': 'truecolor', 'SLURM_STEP_NUM_TASKS': '4', 'PYENV_SHELL': 'bash', 'SLURM_JOB_USER': 'xun', 'SLURM_TASKS_PER_NODE': '1(x4)', 'PYTHONUNBUFFERED': '1', 'SLURM_JOB_UID': '1005', 'OLD_PATH': '/usr/local/cuda/bin:/opt/slurm/bin:/home/xun/.local/bin:/opt/pyenv/shims:/opt/pyenv/bin:/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/bin/remote-cli:/home/xun/.local/bin:/home/xun/bin:/home/xun/.nvm/versions/node/v22.22.2/bin:/home/xun/anaconda3/bin:/home/xun/anaconda3/condabin:/home/xun/.local/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/opt/pyenv/bin:/home/xun/.local/bin:/home/xun/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin', 'SLURM_STEP_GPUS': '0,1,2,3,4,5,6,7', 'NVM_INC': '/home/xun/.nvm/versions/node/v22.22.2/include/node', 'TERM_PROGRAM_VERSION': '3.1.15', 'SLURM_CPU_BIND': 'quiet,mask_cpu:0x000000FFFFFFFFFFFFFFFF000000FFFFFFFFFFFFFFFF', 'HPCX_HCOLL_DIR': '/opt/hpcx/hcoll', 'SLURM_TASK_PID': '469971', 'CONDA_EXE': '/home/xun/anaconda3/bin/conda', '_CE_M': '', 'PKG_CONFIG_PATH': '/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:', 'SLURM_JOB_GPUS': '0,1,2,3,4,5,6,7', 'SLURM_LOCALID': '0', 'PYTHONNOUSERSITE': '1', 'SLURM_SUBMIT_DIR': '/home/xun/rsadhukh/STEM', 'SLURM_CPU_BIND_VERBOSE': 'quiet', 'HOSTNAME': 'compute-node-3', 'HPCX_CLUSTERKIT_DIR': '/opt/hpcx/clusterkit', 'SLURMD_NODENAME': 'compute-node-3', 'MASTER_PORT': '29500', 'SLURM_JOB_START_TIME': '1777476890', 'TORCH_NCCL_TIMEOUT': '1200', 'HYDRA_LAUNCHER_EXTRA_ARGS': '--external-launcher', 'OMPI_HOME': '/opt/hpcx/ompi', 'HPCX_OSU_CUDA_DIR': '/opt/hpcx/ompi/tests/osu-micro-benchmarks-cuda', 'SLURM_STEP_NODELIST': 'compute-node-[3,7,46-47]', 'TRAINING_LOG_DIR': '/home/xun/rsadhukh/STEM/logs/midfine_base_final', 'WANDB_DIR': '/home/xun/rsadhukh/STEM/logs/midfine_base_final', 'SLURM_CLUSTER_NAME': 'cluster', 'SLURM_JOB_END_TIME': '1777649690', 'SLURM_CPUS_ON_NODE': '128', 'SLURM_UMASK': '0000', 'HPCX_OSU_DIR': '/opt/hpcx/ompi/tests/osu-micro-benchmarks', 'SLURM_JOB_CPUS_PER_NODE': '128(x4)', 'HPCX_MPI_DIR': '/opt/hpcx/ompi', 'HPCX_OSHMEM_DIR': '/opt/hpcx/ompi', 'SLURM_GPUS_ON_NODE': '8', 'PWD': '/home/xun/rsadhukh/STEM', 'HPCX_UCC_DIR': '/opt/hpcx/ucc', 'PRTE_MCA_plm_slurm_args': '--external-launcher', 'SLURM_GTIDS': '0', 'GSETTINGS_SCHEMA_DIR': '/home/xun/anaconda3/share/glib-2.0/schemas', 'LOGNAME': 'xun', 'XDG_SESSION_TYPE': 'tty', 'CONDA_PREFIX': '/home/xun/anaconda3', 'SLURM_JOB_PARTITION': 'high', 'MODULESHOME': '/usr/share/modules', 'MANPATH': '/home/xun/.nvm/versions/node/v22.22.2/share/man::', 'SLURM_TRES_PER_TASK': 'cpu:128', 'GSETTINGS_SCHEMA_DIR_CONDA_BACKUP': '', 'SLURM_JOB_NUM_NODES': '4', 'SRUN_DEBUG': '3', 'SLURM_STEPID': '0', 'SLURM_CPU_BIND_LIST': '0x000000FFFFFFFFFFFFFFFF000000FFFFFFFFFFFFFFFF', 'VSCODE_GIT_ASKPASS_NODE': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/node', 'SLURM_JOBID': '29546', 'GLOO_SOCKET_IFNAME': 'ens7', 'WORLD_SIZE': '32', 'SLURM_LAUNCH_NODE_IPADDR': '172.27.61.166', 'I_MPI_HYDRA_BOOTSTRAP_EXEC_EXTRA_ARGS': '--external-launcher', 'OLD_PKG_CONFIG_PATH': '/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:/opt/hpcx/hcoll/lib/pkgconfig:/opt/hpcx/sharp/lib/pkgconfig:/opt/hpcx/ucx/lib/pkgconfig:/opt/hpcx/ompi/lib/pkgconfig:', 'MPI_HOME': '/opt/hpcx/ompi', 'MOTD_SHOWN': 'pam', 'TORCH_LOGS': 'recompiles,graph_breaks,dynamo,inductor', 'HOME': '/home/xun', 'LANG': 'C.UTF-8', 'SLURM_CPU_BIND_TYPE': 'mask_cpu:', 'LS_COLORS': 'rs=0:di=01;34:ln=01;36:mh=00:pi=40;33:so=01;35:do=01;35:bd=40;33;01:cd=40;33;01:or=40;31;01:mi=00:su=37;41:sg=30;43:ca=30;41:tw=30;42:ow=34;42:st=37;44:ex=01;32:*.tar=01;31:*.tgz=01;31:*.arc=01;31:*.arj=01;31:*.taz=01;31:*.lha=01;31:*.lz4=01;31:*.lzh=01;31:*.lzma=01;31:*.tlz=01;31:*.txz=01;31:*.tzo=01;31:*.t7z=01;31:*.zip=01;31:*.z=01;31:*.dz=01;31:*.gz=01;31:*.lrz=01;31:*.lz=01;31:*.lzo=01;31:*.xz=01;31:*.zst=01;31:*.tzst=01;31:*.bz2=01;31:*.bz=01;31:*.tbz=01;31:*.tbz2=01;31:*.tz=01;31:*.deb=01;31:*.rpm=01;31:*.jar=01;31:*.war=01;31:*.ear=01;31:*.sar=01;31:*.rar=01;31:*.alz=01;31:*.ace=01;31:*.zoo=01;31:*.cpio=01;31:*.7z=01;31:*.rz=01;31:*.cab=01;31:*.wim=01;31:*.swm=01;31:*.dwm=01;31:*.esd=01;31:*.jpg=01;35:*.jpeg=01;35:*.mjpg=01;35:*.mjpeg=01;35:*.gif=01;35:*.bmp=01;35:*.pbm=01;35:*.pgm=01;35:*.ppm=01;35:*.tga=01;35:*.xbm=01;35:*.xpm=01;35:*.tif=01;35:*.tiff=01;35:*.png=01;35:*.svg=01;35:*.svgz=01;35:*.mng=01;35:*.pcx=01;35:*.mov=01;35:*.mpg=01;35:*.mpeg=01;35:*.m2v=01;35:*.mkv=01;35:*.webm=01;35:*.webp=01;35:*.ogm=01;35:*.mp4=01;35:*.m4v=01;35:*.mp4v=01;35:*.vob=01;35:*.qt=01;35:*.nuv=01;35:*.wmv=01;35:*.asf=01;35:*.rm=01;35:*.rmvb=01;35:*.flc=01;35:*.avi=01;35:*.fli=01;35:*.flv=01;35:*.gl=01;35:*.dl=01;35:*.xcf=01;35:*.xwd=01;35:*.yuv=01;35:*.cgm=01;35:*.emf=01;35:*.ogv=01;35:*.ogx=01;35:*.aac=00;36:*.au=00;36:*.flac=00;36:*.m4a=00;36:*.mid=00;36:*.midi=00;36:*.mka=00;36:*.mp3=00;36:*.mpc=00;36:*.ogg=00;36:*.ra=00;36:*.wav=00;36:*.oga=00;36:*.opus=00;36:*.spx=00;36:*.xspf=00;36:', 'OSHMEM_HOME': '/opt/hpcx/ompi', 'SLURMD_DEBUG': '2', 'SLURM_PROCID': '0', 'OLD_LIBRARY_PATH': '/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:', 'VIRTUAL_ENV': '/home/xun/rsadhukh/STEM/stem', 'SSL_CERT_DIR': '/usr/lib/ssl/certs', 'HPCX_UCX_DIR': '/opt/hpcx/ucx', 'CONDA_PROMPT_MODIFIER': '(base) ', 'TMPDIR': '/scratch/local/xun/tmp', 'GIT_ASKPASS': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/extensions/git/dist/askpass.sh', 'VSCODE_GIT_IPC_AUTH_TOKEN': 'e9c91a1bab37ff9482f8c1a25d24a2b678ee98e75266f48ee778bb93a29d0880', 'SLURM_CPUS_PER_TASK': '128', 'SLURM_NTASKS': '4', 'CONFIG_PATH': 'apps/main/configs/olmo2_1B_midfine.yaml', 'SLURM_TOPOLOGY_ADDR': 'compute-node-3', 'SSH_CONNECTION': '67.163.187.8 64380 172.27.51.97 22', 'OLD_CPATH': '/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:', 'SLURM_DISTRIBUTION': 'cyclic', 'ROOT_MODEL_DIR': '/data/rsadhukh/checkpoints', 'PYTORCH_CUDA_ALLOC_CONF': 'expandable_segments:True', 'HYDRA_BOOTSTRAP': 'slurm', 'SHMEM_HOME': '/opt/hpcx/ompi', 'NVM_DIR': '/home/xun/.nvm', 'MASTER_ADDR': 'compute-node-3', 'VSCODE_GIT_ASKPASS_EXTRA_ARGS': '', 'CUDA_VISIBLE_DEVICES': '0,1,2,3,4,5,6,7', 'SLURM_TOPOLOGY_ADDR_PATTERN': 'node', 'SLURM_SRUN_COMM_HOST': '172.27.61.166', '_CONDA_EXE': '/home/xun/anaconda3/bin/conda', 'LESSCLOSE': '/usr/bin/lesspipe %s %s', '_CONDA_ROOT': '/home/xun/anaconda3', 'XDG_SESSION_CLASS': 'user', 'PYTHONPATH': '/home/xun/rsadhukh/STEM:', 'TERM': 'xterm-256color', '_CE_CONDA': '', 'LESSOPEN': '| /usr/bin/lesspipe %s', 'USER': 'xun', 'LIBRARY_PATH': '/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ompi/lib:/opt/hpcx/sharp/lib:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:', 'HPCX_SHARP_DIR': '/opt/hpcx/sharp', 'SLURM_NODELIST': 'compute-node-[3,7,46-47]', 'WANDB_API_KEY': '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', 'VSCODE_GIT_IPC_HANDLE': '/run/user/1005/vscode-git-21eb2adf6a.sock', 'ENVIRONMENT': 'BATCH', 'CONDA_SHLVL': '1', 'SLURM_SRUN_COMM_PORT': '33673', 'NODES': '4', 'EXP_NAME': 'midfine_base_final', 'LOADEDMODULES': '', 'TEMP': '/scratch/local/xun/tmp', 'SLURM_STEP_ID': '0', 'SLURM_PRIO_PROCESS': '0', 'SLURM_NPROCS': '4', 'SHLVL': '3', 'NVM_CD_FLAGS': '', 'SLURM_NNODES': '4', 'WANDB_MODE': 'online', 'HPCX_DIR': '/opt/hpcx', 'XDG_SESSION_ID': '1916', 'VIRTUAL_ENV_PROMPT': '(stem) ', 'TORCHINDUCTOR_COMPILE_THREADS': '32', 'SLURM_SUBMIT_HOST': 'login-node-0', 'CONDA_PYTHON_EXE': '/home/xun/anaconda3/bin/python', 'LD_LIBRARY_PATH': '/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:', 'NCCL_IB_DISABLE': '0', 'XDG_RUNTIME_DIR': '/run/user/1005', 'SLURM_JOB_ID': '29546', 'SSL_CERT_FILE': '/usr/lib/ssl/certs/ca-certificates.crt', 'SLURM_NODEID': '0', 'PS1': '(stem) ', 'SLURM_STEP_NUM_NODES': '4', 'SSH_CLIENT': '67.163.187.8 64380 22', 'CONDA_DEFAULT_ENV': 'base', 'PYENV_ROOT': '/opt/pyenv', 'OPAL_PREFIX': '/opt/hpcx/ompi', 'OMP_NUM_THREADS': '1', 'OLD_LD_LIBRARY_PATH': '/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:/opt/hpcx/nccl_rdma_sharp_plugin/lib:/opt/hpcx/ucc/lib/ucc:/opt/hpcx/ucc/lib:/opt/hpcx/ucx/lib/ucx:/opt/hpcx/ucx/lib:/opt/hpcx/sharp/lib:/opt/hpcx/hcoll/lib:/opt/hpcx/ompi/lib:/usr/local/cuda/lib64:', 'SLURM_STEP_TASKS_PER_NODE': '1(x4)', 'WORLD_MODEL_LOG_LEVEL': 'DEBUG', 'VSCODE_GIT_ASKPASS_MAIN': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/extensions/git/dist/askpass-main.js', 'CUDA_HOME': '/usr/local/cuda-12.8', 'DATA_ROOT_DIR': '/home/xun/rsadhukh/STEM/data', 'XDG_DATA_DIRS': '/usr/local/share:/usr/share:/var/lib/snapd/desktop', 'NPROC_PER_NODE': '8', 'TORCH_FR_BUFFER_SIZE': '32', 'TMP': '/scratch/local/xun/tmp', 'BROWSER': '/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/bin/helpers/browser.sh', 'SLURM_CONF': '/var/spool/slurmd/conf-cache/slurm.conf', 'PATH': '/home/xun/rsadhukh/STEM/stem/bin:/home/xun/.local/bin:/home/xun/bin:/opt/pyenv/shims:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/home/xun/.local/bin:/opt/pyenv/bin:/home/xun/.cursor-server/cli/servers/Stable-3a67af7b780e0bfc8d32aefa96b8ff1cb8817f80/server/bin/remote-cli:/home/xun/.local/bin:/home/xun/bin:/home/xun/.nvm/versions/node/v22.22.2/bin:/home/xun/anaconda3/bin:/home/xun/anaconda3/condabin:/home/xun/.local/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/opt/pyenv/bin:/home/xun/.local/bin:/home/xun/bin:/opt/pyenv/bin:/opt/hpcx/sharp/bin:/opt/hpcx/clusterkit/bin:/opt/hpcx/hcoll/bin:/opt/hpcx/ucc/bin:/opt/hpcx/ucx/bin:/opt/hpcx/ompi/bin:/usr/local/cuda/bin:/opt/slurm/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin', 'HPCX_NCCL_RDMA_SHARP_PLUGIN_DIR': '/opt/hpcx/nccl_rdma_sharp_plugin', 'SLURM_JOB_NAME': 'stem', 'MODULEPATH': '/etc/environment-modules/modules:/usr/share/modules/versions:/usr/share/modules/$MODULE_VERSION/modulefiles:/usr/share/modules/modulefiles', 'SLURM_NTASKS_PER_NODE': '1', 'HPCX_MPI_TESTS_DIR': '/opt/hpcx/ompi/tests', 'DBUS_SESSION_BUS_ADDRESS': 'unix:path=/run/user/1005/bus', 'OLD_OPAL_PREFIX': '/opt/hpcx/ompi', 'NVM_BIN': '/home/xun/.nvm/versions/node/v22.22.2/bin', 'SLURM_STEP_LAUNCHER_PORT': '33673', 'OMPI_MCA_plm_slurm_args': '--external-launcher', 'SLURM_JOB_GID': '1005', 'CPATH': '/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:/opt/hpcx/ompi/include:/opt/hpcx/ucc/include:/opt/hpcx/ucx/include:/opt/hpcx/sharp/include:/opt/hpcx/hcoll/include:', 'HF_ALLOW_CODE_EVAL': '1', 'OVSX_REGISTRY_URL': 'https://open-vsx.org', 'OLDPWD': '/home/xun/rsadhukh/STEM', 'SLURM_JOB_NODELIST': 'compute-node-[3,7,46-47]', 'MODULES_CMD': '/usr/lib/x86_64-linux-gnu/modulecmd.tcl', 'TERM_PROGRAM': 'vscode', 'SLURM_OUTPUT_MODE': 'standard', 'VSCODE_IPC_HOOK_CLI': '/run/user/1005/vscode-ipc-6e7881a1-db52-4a0c-a6a0-9765d1799424.sock', 'I_MPI_HYDRA_BOOTSTRAP': 'slurm', 'BASH_FUNC_ml%%': '() { module ml "$@"\n}', 'BASH_FUNC_module%%': '() { eval `/usr/bin/tclsh8.6 /usr/lib/x86_64-linux-gnu/modulecmd.tcl bash "$@"`;\n _mlstatus=$?;\n return $_mlstatus\n}', '_': '/usr/bin/stdbuf', '_STDBUF_O': 'L', '_STDBUF_E': 'L', 'LD_PRELOAD': '/usr/libexec/coreutils/libstdbuf.so', 'LOCAL_RANK': '0', 'RANK': '0', 'GROUP_RANK': '0', 'ROLE_RANK': '0', 'ROLE_NAME': 'default', 'LOCAL_WORLD_SIZE': '8', 'GROUP_WORLD_SIZE': '4', 'ROLE_WORLD_SIZE': '32', 'TORCHELASTIC_RESTART_COUNT': '0', 'TORCHELASTIC_MAX_RESTARTS': '0', 'TORCHELASTIC_RUN_ID': 'none', 'TORCHELASTIC_USE_AGENT_STORE': 'True', 'TORCH_NCCL_ASYNC_ERROR_HANDLING': '1', 'TORCHELASTIC_ERROR_FILE': '/scratch/local/xun/tmp/torchelastic_opolicti/none_8o85yfdi/attempt_0/0/error.json', 'CUDA_MODULE_LOADING': 'LAZY', 'TORCHINDUCTOR_CACHE_DIR': '/scratch/local/xun/tmp/torchinductor_xun', 'KMP_DUPLICATE_LIB_OK': 'True', 'KMP_INIT_AT_FORK': 'FALSE', 'MKL_SERVICE_FORCE_INTEL': 'GNU', 'MKL_NUM_THREADS': '1', 'ENABLE_INTRA_NODE_COMM': '1', 'TORCH_NCCL_AVOID_RECORD_STREAMS': '1', 'NCCL_IB_TIMEOUT': '22', 'NCCL_DEBUG': 'INFO', 'TRITON_CACHE_DIR': '/scratch/local/xun/tmp/tmpfxgobe_y'}) 0: INFO 26-04-29 15:35:34.040042 - 0:00:14 - Starting job: olmo2_1B_midfine 0: INFO 26-04-29 15:35:34.040288 - 0:00:14 - Running on dp rank : 0 0: INFO 26-04-29 15:35:34.040357 - 0:00:14 - Running on dp size : 32 0: INFO 26-04-29 15:35:34.040404 - 0:00:14 - Using model type: olmo3 (OLMo3LMTransformer) 0: INFO 26-04-29 15:35:34.042348 - 0:00:14 - Building model 0: INFO 26-04-29 15:35:34.059424 - 0:00:14 - Model is built ! 0: WARNING 26-04-29 15:35:34.293994 - 0:00:15 - Model parameter layers.0.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.294669 - 0:00:15 - Model parameter layers.0.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.295227 - 0:00:15 - Model parameter layers.0.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.295606 - 0:00:15 - Model parameter layers.0.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.295887 - 0:00:15 - Model parameter layers.0.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.296149 - 0:00:15 - Model parameter layers.0.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.296455 - 0:00:15 - Model parameter layers.0.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.296763 - 0:00:15 - Model parameter layers.0.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.297051 - 0:00:15 - Model parameter layers.0.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.297321 - 0:00:15 - Model parameter layers.0.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.297601 - 0:00:15 - Model parameter layers.0.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.297894 - 0:00:15 - Model parameter layers.1.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.298266 - 0:00:15 - Model parameter layers.1.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.298607 - 0:00:15 - Model parameter layers.1.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.298916 - 0:00:15 - Model parameter layers.1.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.299199 - 0:00:15 - Model parameter layers.1.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.299479 - 0:00:15 - Model parameter layers.1.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.299776 - 0:00:15 - Model parameter layers.1.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.300058 - 0:00:15 - Model parameter layers.1.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.300352 - 0:00:15 - Model parameter layers.1.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.300628 - 0:00:15 - Model parameter layers.1.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.300885 - 0:00:15 - Model parameter layers.1.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.301163 - 0:00:15 - Model parameter layers.2.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.301461 - 0:00:15 - Model parameter layers.2.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.301746 - 0:00:15 - Model parameter layers.2.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.302021 - 0:00:15 - Model parameter layers.2.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.302276 - 0:00:15 - Model parameter layers.2.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.302559 - 0:00:15 - Model parameter layers.2.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.302884 - 0:00:15 - Model parameter layers.2.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.303214 - 0:00:15 - Model parameter layers.2.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.303614 - 0:00:15 - Model parameter layers.2.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.303929 - 0:00:15 - Model parameter layers.2.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.304193 - 0:00:15 - Model parameter layers.2.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.304505 - 0:00:15 - Model parameter layers.3.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.304797 - 0:00:15 - Model parameter layers.3.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.305080 - 0:00:15 - Model parameter layers.3.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.305370 - 0:00:15 - Model parameter layers.3.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.305639 - 0:00:15 - Model parameter layers.3.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.305904 - 0:00:15 - Model parameter layers.3.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.306183 - 0:00:15 - Model parameter layers.3.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.306489 - 0:00:15 - Model parameter layers.3.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.306786 - 0:00:15 - Model parameter layers.3.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.307078 - 0:00:15 - Model parameter layers.3.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.307354 - 0:00:15 - Model parameter layers.3.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.307656 - 0:00:15 - Model parameter layers.4.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.307935 - 0:00:15 - Model parameter layers.4.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.308208 - 0:00:15 - Model parameter layers.4.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.308510 - 0:00:15 - Model parameter layers.4.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.308782 - 0:00:15 - Model parameter layers.4.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.309038 - 0:00:15 - Model parameter layers.4.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.309327 - 0:00:15 - Model parameter layers.4.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.309623 - 0:00:15 - Model parameter layers.4.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.309901 - 0:00:15 - Model parameter layers.4.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.310154 - 0:00:15 - Model parameter layers.4.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.310433 - 0:00:15 - Model parameter layers.4.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.310729 - 0:00:15 - Model parameter layers.5.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.311042 - 0:00:15 - Model parameter layers.5.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.311344 - 0:00:15 - Model parameter layers.5.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.311634 - 0:00:15 - Model parameter layers.5.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.311893 - 0:00:15 - Model parameter layers.5.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.312148 - 0:00:15 - Model parameter layers.5.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.312451 - 0:00:15 - Model parameter layers.5.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.312744 - 0:00:15 - Model parameter layers.5.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.313024 - 0:00:15 - Model parameter layers.5.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.313287 - 0:00:15 - Model parameter layers.5.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.313570 - 0:00:15 - Model parameter layers.5.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.313861 - 0:00:15 - Model parameter layers.6.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.314154 - 0:00:15 - Model parameter layers.6.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.314455 - 0:00:15 - Model parameter layers.6.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.314750 - 0:00:15 - Model parameter layers.6.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.315037 - 0:00:15 - Model parameter layers.6.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.315319 - 0:00:15 - Model parameter layers.6.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.315627 - 0:00:15 - Model parameter layers.6.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.315915 - 0:00:15 - Model parameter layers.6.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.316200 - 0:00:15 - Model parameter layers.6.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.316472 - 0:00:15 - Model parameter layers.6.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.316744 - 0:00:15 - Model parameter layers.6.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.317032 - 0:00:15 - Model parameter layers.7.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.317322 - 0:00:15 - Model parameter layers.7.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.317620 - 0:00:15 - Model parameter layers.7.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.317898 - 0:00:15 - Model parameter layers.7.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.318155 - 0:00:15 - Model parameter layers.7.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.318424 - 0:00:15 - Model parameter layers.7.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.318715 - 0:00:15 - Model parameter layers.7.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.319024 - 0:00:15 - Model parameter layers.7.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.319325 - 0:00:15 - Model parameter layers.7.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.319614 - 0:00:15 - Model parameter layers.7.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.319873 - 0:00:15 - Model parameter layers.7.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.320153 - 0:00:15 - Model parameter layers.8.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.320455 - 0:00:15 - Model parameter layers.8.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.320748 - 0:00:15 - Model parameter layers.8.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.321026 - 0:00:15 - Model parameter layers.8.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.321281 - 0:00:15 - Model parameter layers.8.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.321561 - 0:00:15 - Model parameter layers.8.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.321844 - 0:00:15 - Model parameter layers.8.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.322123 - 0:00:15 - Model parameter layers.8.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.322411 - 0:00:15 - Model parameter layers.8.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.322683 - 0:00:15 - Model parameter layers.8.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.322962 - 0:00:15 - Model parameter layers.8.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.323257 - 0:00:15 - Model parameter layers.9.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.323568 - 0:00:15 - Model parameter layers.9.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.323854 - 0:00:15 - Model parameter layers.9.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.324135 - 0:00:15 - Model parameter layers.9.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.324405 - 0:00:15 - Model parameter layers.9.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.324709 - 0:00:15 - Model parameter layers.9.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.325001 - 0:00:15 - Model parameter layers.9.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.325284 - 0:00:15 - Model parameter layers.9.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.325587 - 0:00:15 - Model parameter layers.9.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.325852 - 0:00:15 - Model parameter layers.9.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.326102 - 0:00:15 - Model parameter layers.9.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.326394 - 0:00:15 - Model parameter layers.10.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.326686 - 0:00:15 - Model parameter layers.10.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.326991 - 0:00:15 - Model parameter layers.10.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.327292 - 0:00:15 - Model parameter layers.10.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.327590 - 0:00:15 - Model parameter layers.10.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.327872 - 0:00:15 - Model parameter layers.10.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.328167 - 0:00:15 - Model parameter layers.10.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.328462 - 0:00:15 - Model parameter layers.10.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.328757 - 0:00:15 - Model parameter layers.10.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.329012 - 0:00:15 - Model parameter layers.10.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.329263 - 0:00:15 - Model parameter layers.10.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.329577 - 0:00:15 - Model parameter layers.11.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.329856 - 0:00:15 - Model parameter layers.11.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.330129 - 0:00:15 - Model parameter layers.11.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.330415 - 0:00:15 - Model parameter layers.11.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.330683 - 0:00:15 - Model parameter layers.11.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.330973 - 0:00:15 - Model parameter layers.11.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.331269 - 0:00:15 - Model parameter layers.11.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.331575 - 0:00:15 - Model parameter layers.11.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.331862 - 0:00:15 - Model parameter layers.11.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.332117 - 0:00:15 - Model parameter layers.11.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.332389 - 0:00:15 - Model parameter layers.11.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.332694 - 0:00:15 - Model parameter layers.12.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.332978 - 0:00:15 - Model parameter layers.12.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.333266 - 0:00:15 - Model parameter layers.12.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.333572 - 0:00:15 - Model parameter layers.12.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.333832 - 0:00:15 - Model parameter layers.12.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.334084 - 0:00:15 - Model parameter layers.12.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.334381 - 0:00:15 - Model parameter layers.12.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.334680 - 0:00:15 - Model parameter layers.12.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.334989 - 0:00:15 - Model parameter layers.12.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.335259 - 0:00:15 - Model parameter layers.12.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.335545 - 0:00:15 - Model parameter layers.12.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.335842 - 0:00:15 - Model parameter layers.13.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.336114 - 0:00:15 - Model parameter layers.13.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.336404 - 0:00:15 - Model parameter layers.13.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.336703 - 0:00:15 - Model parameter layers.13.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.336964 - 0:00:15 - Model parameter layers.13.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.337215 - 0:00:15 - Model parameter layers.13.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.337509 - 0:00:15 - Model parameter layers.13.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.337799 - 0:00:15 - Model parameter layers.13.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.338075 - 0:00:15 - Model parameter layers.13.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.338345 - 0:00:15 - Model parameter layers.13.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.338614 - 0:00:15 - Model parameter layers.13.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.338922 - 0:00:15 - Model parameter layers.14.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.339215 - 0:00:15 - Model parameter layers.14.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.339509 - 0:00:15 - Model parameter layers.14.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.339803 - 0:00:15 - Model parameter layers.14.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.340060 - 0:00:15 - Model parameter layers.14.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.340318 - 0:00:15 - Model parameter layers.14.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.340615 - 0:00:15 - Model parameter layers.14.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.340894 - 0:00:15 - Model parameter layers.14.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.341181 - 0:00:15 - Model parameter layers.14.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.341449 - 0:00:15 - Model parameter layers.14.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.341715 - 0:00:15 - Model parameter layers.14.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.341995 - 0:00:15 - Model parameter layers.15.attention.wq.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.342279 - 0:00:15 - Model parameter layers.15.attention.wk.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.342578 - 0:00:15 - Model parameter layers.15.attention.wv.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.342875 - 0:00:15 - Model parameter layers.15.attention.wo.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.343153 - 0:00:15 - Model parameter layers.15.attention.q_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.343432 - 0:00:15 - Model parameter layers.15.attention.k_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.343726 - 0:00:15 - Model parameter layers.15.feed_forward.w1.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.344003 - 0:00:15 - Model parameter layers.15.feed_forward.w3.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.344282 - 0:00:15 - Model parameter layers.15.feed_forward.w2.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.344567 - 0:00:15 - Model parameter layers.15.post_attention_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.344827 - 0:00:15 - Model parameter layers.15.post_feedforward_norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.345550 - 0:00:15 - Model parameter tok_embeddings.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.345913 - 0:00:15 - Model parameter norm.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.346250 - 0:00:15 - Model parameter output.weight is all zeros: it might be because of a missing initialization 0: WARNING 26-04-29 15:35:34.346606 - 0:00:15 - Model parameter rope_embeddings.freqs_cis is all zeros: it might be because of a missing initialization 0: INFO 26-04-29 15:35:34.347163 - 0:00:15 - Model size: 1,484,916,736 total parameters 0: INFO 26-04-29 15:35:34.347658 - 0:00:15 - GPU capacity: NVIDIA H200 (0) with 139.80GiB memory 0: INFO 26-04-29 15:35:34.352227 - 0:00:15 - GPU memory usage: NVIDIA H200 (0): 139.80084228515625 GiB capacity, 0.208984375 GiB peak, 0.14948720736154641% peak 0: INFO 26-04-29 15:35:34.352355 - 0:00:15 - Starting build of optimizer... 0: INFO 26-04-29 15:35:34.353204 - 0:00:15 - Done with build of optimizer. 0: INFO 26-04-29 15:35:34.353280 - 0:00:15 - Using global DP dataloader sharding: rank 0/32 0: INFO 26-04-29 15:35:35.403910 - 0:00:16 - Loading initial model & optimizer from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/ 0: INFO 26-04-29 15:35:49.113942 - 0:00:29 - Reloading train state 0: INFO 26-04-29 15:35:49.121886 - 0:00:29 - Train state reloaded 0: INFO 26-04-29 15:35:49.122031 - 0:00:29 - Loading from: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000015000 0: INFO 26-04-29 15:35:51.444052 - 0:00:32 - Model and optim reloaded 0: DEBUG 26-04-29 15:35:51.455160 - 0:00:32 - Using selector: EpollSelector 0: DEBUG 26-04-29 15:35:51.541434 - 0:00:32 - Popen(['git', 'version'], cwd=/home/xun/rsadhukh/STEM, stdin=None, shell=False, universal_newlines=False) 0: DEBUG 26-04-29 15:35:51.555455 - 0:00:32 - Popen(['git', 'version'], cwd=/home/xun/rsadhukh/STEM, stdin=None, shell=False, universal_newlines=False) 0: DEBUG 26-04-29 15:35:51.561572 - 0:00:32 - sys.platform='linux', git_executable='git' 0: DEBUG 26-04-29 15:35:51.564696 - 0:00:32 - Popen(['git', 'rev-parse', '--show-toplevel'], cwd=/home/xun/rsadhukh/STEM, stdin=None, shell=False, universal_newlines=False) 0: DEBUG 26-04-29 15:35:51.579538 - 0:00:32 - Starting new HTTPS connection (1): api.wandb.ai:443 0: DEBUG 26-04-29 15:35:52.105309 - 0:00:32 - https://api.wandb.ai:443 "POST /graphql HTTP/1.1" 200 None 0: DEBUG 26-04-29 15:35:52.410943 - 0:00:33 - sys.platform='linux', git_executable='git' 0: DEBUG 26-04-29 15:35:52.414397 - 0:00:33 - Popen(['git', 'cat-file', '--batch-check'], cwd=/home/xun/rsadhukh/STEM, stdin=, shell=False, universal_newlines=False) 0: INFO 26-04-29 15:35:54.077462 - 0:00:34 - Loading data loader... 0: WARNING 26-04-29 15:35:54.077966 - 0:00:34 - track_packed_source_mixture=True: source counts are updated in the dataloader process only; forcing synchronous dataloader (load_async=False) for this run. 0: INFO 26-04-29 15:35:54.078386 - 0:00:34 - Loaded data loader! 0: INFO 26-04-29 15:35:54.078598 - 0:00:34 - Profiling active. Traces will be saved at /home/xun/rsadhukh/STEM/logs/midfine_base_final/profiling 0: INFO 26-04-29 15:35:54.079180 - 0:00:34 - Created trace directory! 0: INFO 26-04-29 15:35:54.079531 - 0:00:34 - Waiting at profiler barrier... 0: INFO 26-04-29 15:35:54.080173 - 0:00:34 - Profiler barrier passed 0: INFO 26-04-29 15:35:55.186280 - 0:00:35 - Using vocab_size=100352 from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/config.json (tokenizer has 100278 tokens) 0: INFO 26-04-29 15:35:55.187710 - 0:00:35 - HuggingFace tokenizer loaded from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/ – #words: 100352, BOS ID: 100257, EOS ID: 100257 0: INFO 26-04-29 15:38:12.874226 - 0:02:53 - garbage collection 0: INFO 26-04-29 15:38:26.356526 - 0:03:07 - step: 15010 acc: 0 loss: 1.7544 grad: 1.73e-01 flops: 3.71e+13 wps: 4.30e+03 iter: 0.6567 data: 0.092 lr: 5.21e-05 mem: 54% pow: 624.057 W 0: INFO 26-04-29 15:38:40.231436 - 0:03:21 - step: 15020 acc: 0 loss: 2.0393 grad: 1.64e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6291 data: 0.0742 lr: 5.21e-05 mem: 47% pow: 655.421 W 0: INFO 26-04-29 15:38:54.114997 - 0:03:34 - step: 15030 acc: 0 loss: 1.8195 grad: 1.62e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6587 data: 0.0858 lr: 5.20e-05 mem: 47% pow: 641.399 W 0: INFO 26-04-29 15:39:08.154111 - 0:03:48 - step: 15040 acc: 0 loss: 1.3898 grad: 1.76e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6631 data: 0.0835 lr: 5.20e-05 mem: 47% pow: 624.785 W 0: INFO 26-04-29 15:39:22.449570 - 0:04:03 - Starting MemSnapshotsProfilerWandb profiler... 0: INFO 26-04-29 15:39:22.452917 - 0:04:03 - step: 15050 acc: 0 loss: 1.5927 grad: 1.84e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.5814 data: 0.1056 lr: 5.20e-05 mem: 47% pow: 667.811 W 0: INFO 26-04-29 15:39:23.991596 - 0:04:04 - Shutting down MemSnapshotsProfilerWandb profiler... 0: INFO 26-04-29 15:39:24.086053 - 0:04:04 - Starting PyTorchProfilerWandb profiler... 0: INFO 26-04-29 15:39:25.621165 - 0:04:06 - Shutting down PyTorchProfilerWandb profiler... 0: INFO 26-04-29 15:39:26.672852 - 0:04:07 - Begin analyze trace 0: INFO 26-04-29 15:39:27.107681 - 0:04:07 - End analyze trace 0: INFO 26-04-29 15:39:27.267969 - 0:04:08 - xFormers profiler done. summary: MemTrace : /home/xun/rsadhukh/STEM/logs/midfine_base_final/profiling/memory_trace_plot/000102_rank00_compute-node-3_470303.html Step time (ms): 644 TFlop/step : 273.5 TFlops : 424.0 HFU : 0.000 MFU : 0.000 0: INFO 26-04-29 15:39:38.243895 - 0:04:19 - step: 15060 acc: 0 loss: 1.61 grad: 1.81e-01 flops: 3.58e+14 wps: 4.15e+04 iter: 0.611 data: 0.0817 lr: 5.20e-05 mem: 47% pow: 664.714 W 0: INFO 26-04-29 15:39:52.318176 - 0:04:33 - step: 15070 acc: 0 loss: 1.7124 grad: 1.57e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6311 data: 0.0807 lr: 5.20e-05 mem: 47% pow: 638.193 W 0: INFO 26-04-29 15:40:05.953463 - 0:04:46 - step: 15080 acc: 0 loss: 1.857 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6169 data: 0.0698 lr: 5.20e-05 mem: 47% pow: 664.973 W 0: INFO 26-04-29 15:40:20.689150 - 0:05:01 - step: 15090 acc: 0 loss: 1.6562 grad: 1.69e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.7011 data: 0.0755 lr: 5.19e-05 mem: 47% pow: 600.99 W 0: INFO 26-04-29 15:40:34.709434 - 0:05:15 - step: 15100 acc: 0 loss: 1.6124 grad: 1.51e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5796 data: 0.1343 lr: 5.19e-05 mem: 47% pow: 644.235 W 0: INFO 26-04-29 15:40:51.870549 - 0:05:32 - step: 15110 acc: 0 loss: 1.5796 grad: 1.62e-01 flops: 3.29e+14 wps: 3.82e+04 iter: 0.5979 data: 0.083 lr: 5.19e-05 mem: 54% pow: 659.533 W 0: INFO 26-04-29 15:41:05.596206 - 0:05:46 - step: 15120 acc: 0 loss: 1.7002 grad: 1.82e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6104 data: 0.0764 lr: 5.19e-05 mem: 47% pow: 663.154 W 0: INFO 26-04-29 15:41:19.407384 - 0:06:00 - step: 15130 acc: 0 loss: 1.6391 grad: 1.63e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6058 data: 0.1093 lr: 5.19e-05 mem: 47% pow: 649.178 W 0: INFO 26-04-29 15:41:33.092808 - 0:06:13 - step: 15140 acc: 0 loss: 2.0514 grad: 1.55e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6417 data: 0.0751 lr: 5.19e-05 mem: 47% pow: 641.672 W 0: INFO 26-04-29 15:41:46.784335 - 0:06:27 - step: 15150 acc: 0 loss: 1.4658 grad: 1.74e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6007 data: 0.0927 lr: 5.19e-05 mem: 47% pow: 655.412 W 0: INFO 26-04-29 15:42:00.655942 - 0:06:41 - step: 15160 acc: 0 loss: 1.6834 grad: 1.60e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6652 data: 0.0776 lr: 5.18e-05 mem: 47% pow: 638.447 W 0: INFO 26-04-29 15:42:14.553483 - 0:06:55 - step: 15170 acc: 0 loss: 1.4094 grad: 1.63e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.5827 data: 0.115 lr: 5.18e-05 mem: 47% pow: 645.626 W 0: INFO 26-04-29 15:42:28.478528 - 0:07:09 - step: 15180 acc: 0 loss: 1.666 grad: 1.70e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6251 data: 0.062 lr: 5.18e-05 mem: 47% pow: 663.605 W 0: INFO 26-04-29 15:42:42.144723 - 0:07:22 - step: 15190 acc: 0 loss: 1.8854 grad: 1.59e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5982 data: 0.0769 lr: 5.18e-05 mem: 47% pow: 666.88 W 0: INFO 26-04-29 15:42:56.034627 - 0:07:36 - step: 15200 acc: 0 loss: 1.9074 grad: 1.57e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5932 data: 0.0903 lr: 5.18e-05 mem: 47% pow: 656.932 W 0: INFO 26-04-29 15:43:12.791714 - 0:07:53 - step: 15210 acc: 0 loss: 1.5734 grad: 1.64e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6221 data: 0.0806 lr: 5.18e-05 mem: 54% pow: 648.437 W 0: INFO 26-04-29 15:43:26.724032 - 0:08:07 - step: 15220 acc: 0 loss: 1.9295 grad: 1.68e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6696 data: 0.0263 lr: 5.18e-05 mem: 47% pow: 649.785 W 0: INFO 26-04-29 15:43:40.964697 - 0:08:21 - step: 15230 acc: 0 loss: 1.5902 grad: 1.61e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6262 data: 0.0805 lr: 5.17e-05 mem: 47% pow: 649.591 W 0: INFO 26-04-29 15:43:54.788617 - 0:08:35 - step: 15240 acc: 0 loss: 1.8119 grad: 1.60e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6177 data: 0.0818 lr: 5.17e-05 mem: 47% pow: 646.426 W 0: INFO 26-04-29 15:44:08.371099 - 0:08:49 - step: 15250 acc: 0 loss: 1.5334 grad: 1.65e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5925 data: 0.0867 lr: 5.17e-05 mem: 47% pow: 666.642 W 0: INFO 26-04-29 15:44:22.342321 - 0:09:03 - step: 15260 acc: 0 loss: 1.8017 grad: 1.64e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5938 data: 0.0798 lr: 5.17e-05 mem: 47% pow: 668.351 W 0: INFO 26-04-29 15:44:36.257238 - 0:09:17 - step: 15270 acc: 0 loss: 1.8151 grad: 6.78e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5938 data: 0.0952 lr: 5.17e-05 mem: 47% pow: 648.589 W 0: INFO 26-04-29 15:44:50.099204 - 0:09:30 - step: 15280 acc: 0 loss: 1.812 grad: 1.54e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5848 data: 0.0865 lr: 5.17e-05 mem: 47% pow: 664.179 W 0: INFO 26-04-29 15:45:04.134813 - 0:09:44 - step: 15290 acc: 0 loss: 1.8994 grad: 1.62e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.581 data: 0.4665 lr: 5.16e-05 mem: 47% pow: 460.383 W 0: INFO 26-04-29 15:45:17.889827 - 0:09:58 - step: 15300 acc: 0 loss: 1.8056 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6171 data: 0.077 lr: 5.16e-05 mem: 47% pow: 657.976 W 0: INFO 26-04-29 15:45:34.858385 - 0:10:15 - step: 15310 acc: 0 loss: 2.1491 grad: 1.61e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 0.5882 data: 0.0817 lr: 5.16e-05 mem: 54% pow: 671.637 W 0: INFO 26-04-29 15:45:48.898777 - 0:10:29 - step: 15320 acc: 0 loss: 1.8461 grad: 1.70e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.5905 data: 0.0922 lr: 5.16e-05 mem: 47% pow: 660.738 W 0: INFO 26-04-29 15:46:02.809954 - 0:10:43 - step: 15330 acc: 0 loss: 1.7709 grad: 1.60e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6044 data: 0.0696 lr: 5.16e-05 mem: 47% pow: 659.876 W 0: INFO 26-04-29 15:46:16.725640 - 0:10:57 - step: 15340 acc: 0 loss: 1.6191 grad: 1.62e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7124 data: 0.0455 lr: 5.16e-05 mem: 47% pow: 613.269 W 0: INFO 26-04-29 15:46:30.610311 - 0:11:11 - step: 15350 acc: 0 loss: 1.309 grad: 1.74e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.7029 data: 0.0669 lr: 5.16e-05 mem: 47% pow: 615.725 W 0: INFO 26-04-29 15:46:44.355468 - 0:11:25 - step: 15360 acc: 0 loss: 2.0956 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6054 data: 0.0818 lr: 5.15e-05 mem: 47% pow: 662.3 W 0: INFO 26-04-29 15:46:58.582319 - 0:11:39 - step: 15370 acc: 0 loss: 1.7239 grad: 1.60e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6052 data: 0.0833 lr: 5.15e-05 mem: 47% pow: 661.275 W 0: INFO 26-04-29 15:47:12.662633 - 0:11:53 - step: 15380 acc: 0 loss: 1.6802 grad: 1.54e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6095 data: 0.0843 lr: 5.15e-05 mem: 47% pow: 651.719 W 0: INFO 26-04-29 15:47:26.634883 - 0:12:07 - step: 15390 acc: 0 loss: 1.8967 grad: 1.55e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6067 data: 0.0755 lr: 5.15e-05 mem: 47% pow: 655.309 W 0: INFO 26-04-29 15:47:40.843478 - 0:12:21 - step: 15400 acc: 0 loss: 1.6507 grad: 1.53e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.6318 data: 0.0987 lr: 5.15e-05 mem: 47% pow: 631.368 W 0: INFO 26-04-29 15:47:57.308026 - 0:12:38 - step: 15410 acc: 0 loss: 1.616 grad: 1.51e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.631 data: 0.0767 lr: 5.15e-05 mem: 54% pow: 650.142 W 0: INFO 26-04-29 15:48:11.048298 - 0:12:51 - step: 15420 acc: 0 loss: 1.7769 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.61 data: 0.0869 lr: 5.15e-05 mem: 47% pow: 647.877 W 0: INFO 26-04-29 15:48:25.063592 - 0:13:05 - step: 15430 acc: 0 loss: 1.6401 grad: 1.60e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6638 data: 0.0695 lr: 5.14e-05 mem: 47% pow: 628.408 W 0: INFO 26-04-29 15:48:39.010889 - 0:13:19 - step: 15440 acc: 0 loss: 1.5587 grad: 1.61e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6807 data: 0.0749 lr: 5.14e-05 mem: 47% pow: 610.388 W 0: INFO 26-04-29 15:48:53.307805 - 0:13:34 - step: 15450 acc: 0 loss: 1.87 grad: 1.53e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.596 data: 0.0844 lr: 5.14e-05 mem: 47% pow: 666.632 W 0: INFO 26-04-29 15:49:06.821518 - 0:13:47 - step: 15460 acc: 0 loss: 1.8086 grad: 1.64e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6583 data: 0.0743 lr: 5.14e-05 mem: 47% pow: 639.611 W 0: INFO 26-04-29 15:49:20.557910 - 0:14:01 - step: 15470 acc: 0 loss: 1.7345 grad: 1.66e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6108 data: 0.0755 lr: 5.14e-05 mem: 47% pow: 663.494 W 0: INFO 26-04-29 15:49:34.565716 - 0:14:15 - step: 15480 acc: 0 loss: 1.3889 grad: 1.60e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6384 data: 0.0929 lr: 5.14e-05 mem: 47% pow: 632.038 W 0: INFO 26-04-29 15:49:48.361689 - 0:14:29 - step: 15490 acc: 0 loss: 2.0006 grad: 1.56e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6505 data: 0.0728 lr: 5.14e-05 mem: 47% pow: 644.344 W 0: INFO 26-04-29 15:50:02.546705 - 0:14:43 - step: 15500 acc: 0 loss: 1.2486 grad: 1.59e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6591 data: 0.0705 lr: 5.13e-05 mem: 47% pow: 636.431 W 0: INFO 26-04-29 15:50:19.390120 - 0:15:00 - step: 15510 acc: 0 loss: 1.9995 grad: 1.80e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6461 data: 0.0874 lr: 5.13e-05 mem: 54% pow: 626.768 W 0: INFO 26-04-29 15:50:33.513907 - 0:15:14 - step: 15520 acc: 0 loss: 1.7361 grad: 1.50e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6284 data: 0.0769 lr: 5.13e-05 mem: 47% pow: 648.288 W 0: INFO 26-04-29 15:50:47.204965 - 0:15:28 - step: 15530 acc: 0 loss: 1.7893 grad: 1.68e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6268 data: 0.0502 lr: 5.13e-05 mem: 47% pow: 655.839 W 0: INFO 26-04-29 15:51:01.085564 - 0:15:41 - step: 15540 acc: 0 loss: 1.4576 grad: 1.66e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5951 data: 0.0773 lr: 5.13e-05 mem: 47% pow: 661.187 W 0: INFO 26-04-29 15:51:14.686000 - 0:15:55 - step: 15550 acc: 0 loss: 1.4634 grad: 1.71e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5993 data: 0.0966 lr: 5.13e-05 mem: 47% pow: 646.379 W 0: INFO 26-04-29 15:51:28.970790 - 0:16:09 - step: 15560 acc: 0 loss: 1.7787 grad: 1.63e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6164 data: 0.0845 lr: 5.12e-05 mem: 47% pow: 652.094 W 0: INFO 26-04-29 15:51:43.018512 - 0:16:23 - step: 15570 acc: 0 loss: 1.6788 grad: 1.60e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6305 data: 0.0479 lr: 5.12e-05 mem: 47% pow: 656.947 W 0: INFO 26-04-29 15:51:56.715226 - 0:16:37 - step: 15580 acc: 0 loss: 1.8861 grad: 1.51e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6329 data: 0.0878 lr: 5.12e-05 mem: 47% pow: 639.882 W 0: INFO 26-04-29 15:52:10.598575 - 0:16:51 - step: 15590 acc: 0 loss: 1.8897 grad: 1.47e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5934 data: 0.0873 lr: 5.12e-05 mem: 47% pow: 659.113 W 0: INFO 26-04-29 15:52:24.537033 - 0:17:05 - step: 15600 acc: 0 loss: 1.7583 grad: 1.66e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6463 data: 0.0378 lr: 5.12e-05 mem: 47% pow: 660.426 W 0: INFO 26-04-29 15:52:41.233201 - 0:17:22 - step: 15610 acc: 0 loss: 1.8232 grad: 1.67e-01 flops: 3.38e+14 wps: 3.93e+04 iter: 0.6474 data: 0.055 lr: 5.12e-05 mem: 54% pow: 644.525 W 0: INFO 26-04-29 15:52:55.816230 - 0:17:36 - step: 15620 acc: 0 loss: 1.8624 grad: 1.55e-01 flops: 3.87e+14 wps: 4.50e+04 iter: 0.6116 data: 0.0929 lr: 5.12e-05 mem: 47% pow: 654.303 W 0: INFO 26-04-29 15:53:09.944953 - 0:17:50 - step: 15630 acc: 0 loss: 1.8764 grad: 1.62e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5789 data: 0.0926 lr: 5.11e-05 mem: 47% pow: 663.214 W 0: INFO 26-04-29 15:53:23.512509 - 0:18:04 - step: 15640 acc: 0 loss: 1.8782 grad: 1.66e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.653 data: 0.072 lr: 5.11e-05 mem: 47% pow: 647.844 W 0: INFO 26-04-29 15:53:37.306180 - 0:18:18 - step: 15650 acc: 0 loss: 1.7386 grad: 1.56e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.619 data: 0.0717 lr: 5.11e-05 mem: 47% pow: 666.723 W 0: INFO 26-04-29 15:53:51.004767 - 0:18:31 - step: 15660 acc: 0 loss: 1.465 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6404 data: 0.1015 lr: 5.11e-05 mem: 47% pow: 625.749 W 0: INFO 26-04-29 15:54:04.986218 - 0:18:45 - step: 15670 acc: 0 loss: 1.9191 grad: 1.64e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5963 data: 0.0792 lr: 5.11e-05 mem: 47% pow: 659.277 W 0: INFO 26-04-29 15:54:18.725970 - 0:18:59 - step: 15680 acc: 0 loss: 1.7087 grad: 1.58e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6451 data: 0.0776 lr: 5.11e-05 mem: 47% pow: 637.839 W 0: INFO 26-04-29 15:54:32.483788 - 0:19:13 - step: 15690 acc: 0 loss: 1.6826 grad: 1.67e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.6034 data: 0.0909 lr: 5.11e-05 mem: 47% pow: 651.435 W 0: INFO 26-04-29 15:54:46.509753 - 0:19:27 - step: 15700 acc: 0 loss: 1.3493 grad: 1.64e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.5905 data: 0.0879 lr: 5.10e-05 mem: 47% pow: 660.745 W 0: INFO 26-04-29 15:55:03.403062 - 0:19:44 - step: 15710 acc: 0 loss: 1.6688 grad: 1.61e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6037 data: 0.0892 lr: 5.10e-05 mem: 54% pow: 653.431 W 0: INFO 26-04-29 15:55:17.358088 - 0:19:58 - step: 15720 acc: 0 loss: 1.8794 grad: 1.56e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6684 data: 0.0996 lr: 5.10e-05 mem: 47% pow: 612.081 W 0: INFO 26-04-29 15:55:31.254291 - 0:20:12 - step: 15730 acc: 0 loss: 1.6606 grad: 1.63e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.595 data: 0.0892 lr: 5.10e-05 mem: 47% pow: 664.629 W 0: INFO 26-04-29 15:55:45.006013 - 0:20:25 - step: 15740 acc: 0 loss: 1.8582 grad: 1.62e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6123 data: 0.0807 lr: 5.10e-05 mem: 47% pow: 654.84 W 0: INFO 26-04-29 15:55:58.876159 - 0:20:39 - step: 15750 acc: 0 loss: 1.7396 grad: 1.58e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.61 data: 0.0756 lr: 5.10e-05 mem: 47% pow: 666.794 W 0: INFO 26-04-29 15:56:12.909083 - 0:20:53 - step: 15760 acc: 0 loss: 1.941 grad: 1.51e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6747 data: 0.0728 lr: 5.10e-05 mem: 47% pow: 631.295 W 0: INFO 26-04-29 15:56:26.588492 - 0:21:07 - step: 15770 acc: 0 loss: 1.6064 grad: 1.62e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6561 data: 0.0931 lr: 5.09e-05 mem: 47% pow: 624.529 W 0: INFO 26-04-29 15:56:40.837756 - 0:21:21 - step: 15780 acc: 0 loss: 1.5853 grad: 1.54e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6265 data: 0.0805 lr: 5.09e-05 mem: 47% pow: 652.898 W 0: INFO 26-04-29 15:56:55.065450 - 0:21:35 - step: 15790 acc: 0 loss: 1.6288 grad: 1.54e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.582 data: 0.1066 lr: 5.09e-05 mem: 47% pow: 664.255 W 0: INFO 26-04-29 15:57:08.943325 - 0:21:49 - step: 15800 acc: 0 loss: 1.6228 grad: 1.61e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5904 data: 0.083 lr: 5.09e-05 mem: 47% pow: 664.224 W 0: INFO 26-04-29 15:57:25.637320 - 0:22:06 - step: 15810 acc: 0 loss: 1.6049 grad: 1.81e-01 flops: 3.38e+14 wps: 3.93e+04 iter: 0.5903 data: 0.0785 lr: 5.09e-05 mem: 54% pow: 673.266 W 0: INFO 26-04-29 15:57:39.377428 - 0:22:20 - step: 15820 acc: 0 loss: 1.3597 grad: 1.50e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.612 data: 0.0942 lr: 5.09e-05 mem: 47% pow: 647.192 W 0: INFO 26-04-29 15:57:53.190915 - 0:22:33 - step: 15830 acc: 0 loss: 2.0514 grad: 1.60e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6273 data: 0.0834 lr: 5.08e-05 mem: 47% pow: 650.431 W 0: INFO 26-04-29 15:58:07.134358 - 0:22:47 - step: 15840 acc: 0 loss: 1.9605 grad: 1.50e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5953 data: 0.0877 lr: 5.08e-05 mem: 47% pow: 665.238 W 0: INFO 26-04-29 15:58:21.354469 - 0:23:02 - step: 15850 acc: 0 loss: 1.7467 grad: 1.51e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6531 data: 0.0433 lr: 5.08e-05 mem: 47% pow: 648.124 W 0: INFO 26-04-29 15:58:34.970295 - 0:23:15 - step: 15860 acc: 0 loss: 1.6166 grad: 1.56e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6046 data: 0.0863 lr: 5.08e-05 mem: 47% pow: 671.406 W 0: INFO 26-04-29 15:58:48.618357 - 0:23:29 - step: 15870 acc: 0 loss: 1.6663 grad: 1.64e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5801 data: 0.1097 lr: 5.08e-05 mem: 47% pow: 659.371 W 0: INFO 26-04-29 15:59:02.594500 - 0:23:43 - step: 15880 acc: 0 loss: 1.5164 grad: 1.65e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6051 data: 0.0933 lr: 5.08e-05 mem: 47% pow: 644.19 W 0: INFO 26-04-29 15:59:17.649277 - 0:23:58 - step: 15890 acc: 0 loss: 1.6103 grad: 1.60e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.6619 data: 0.075 lr: 5.08e-05 mem: 47% pow: 624.945 W 0: INFO 26-04-29 15:59:31.672382 - 0:24:12 - step: 15900 acc: 0 loss: 2.06 grad: 1.57e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.618 data: 0.074 lr: 5.07e-05 mem: 47% pow: 654.223 W 0: INFO 26-04-29 15:59:48.717916 - 0:24:29 - step: 15910 acc: 0 loss: 1.7026 grad: 1.59e-01 flops: 3.31e+14 wps: 3.85e+04 iter: 0.623 data: 0.0836 lr: 5.07e-05 mem: 54% pow: 651.264 W 0: INFO 26-04-29 16:00:02.354237 - 0:24:43 - step: 15920 acc: 0 loss: 1.9357 grad: 1.53e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6454 data: 0.0812 lr: 5.07e-05 mem: 47% pow: 634.06 W 0: INFO 26-04-29 16:00:15.957674 - 0:24:56 - step: 15930 acc: 0 loss: 1.7362 grad: 1.66e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5928 data: 0.0942 lr: 5.07e-05 mem: 47% pow: 660.713 W 0: INFO 26-04-29 16:00:29.517885 - 0:25:10 - step: 15940 acc: 0 loss: 1.8271 grad: 1.49e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6426 data: 0.076 lr: 5.07e-05 mem: 47% pow: 652.028 W 0: INFO 26-04-29 16:00:43.429451 - 0:25:24 - step: 15950 acc: 0 loss: 1.8346 grad: 1.56e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6186 data: 0.072 lr: 5.07e-05 mem: 47% pow: 661.826 W 0: INFO 26-04-29 16:00:57.111533 - 0:25:37 - step: 15960 acc: 0 loss: 1.7204 grad: 1.60e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.593 data: 0.0882 lr: 5.07e-05 mem: 47% pow: 658.535 W 0: INFO 26-04-29 16:01:11.197423 - 0:25:51 - step: 15970 acc: 0 loss: 1.4689 grad: 1.49e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5799 data: 0.101 lr: 5.06e-05 mem: 47% pow: 656.253 W 0: INFO 26-04-29 16:01:24.902683 - 0:26:05 - step: 15980 acc: 0 loss: 1.7505 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6644 data: 0.0857 lr: 5.06e-05 mem: 47% pow: 628.184 W 0: INFO 26-04-29 16:01:38.482975 - 0:26:19 - step: 15990 acc: 0 loss: 1.8442 grad: 1.54e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5989 data: 0.0834 lr: 5.06e-05 mem: 47% pow: 667.216 W 0: INFO 26-04-29 16:01:52.164864 - 0:26:32 - step: 16000 acc: 0 loss: 1.6132 grad: 1.55e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5859 data: 0.0885 lr: 5.06e-05 mem: 47% pow: 661.811 W 0: INFO 26-04-29 16:01:55.915236 - 0:26:36 - garbage collection 0: INFO 26-04-29 16:02:10.444402 - 0:26:51 - step: 16010 acc: 0 loss: 1.7279 grad: 1.48e-01 flops: 3.09e+14 wps: 3.59e+04 iter: 0.6679 data: 0.0869 lr: 5.06e-05 mem: 54% pow: 613.304 W 0: INFO 26-04-29 16:02:24.565752 - 0:27:05 - step: 16020 acc: 0 loss: 1.7825 grad: 1.61e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6076 data: 0.0816 lr: 5.06e-05 mem: 47% pow: 654.01 W 0: INFO 26-04-29 16:02:38.772762 - 0:27:19 - step: 16030 acc: 0 loss: 1.6102 grad: 1.83e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.655 data: 0.0856 lr: 5.05e-05 mem: 47% pow: 635.416 W 0: INFO 26-04-29 16:02:52.854516 - 0:27:33 - step: 16040 acc: 0 loss: 1.7001 grad: 1.48e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6299 data: 0.0668 lr: 5.05e-05 mem: 47% pow: 668.662 W 0: INFO 26-04-29 16:03:07.018256 - 0:27:47 - step: 16050 acc: 0 loss: 1.6741 grad: 1.63e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5998 data: 0.0906 lr: 5.05e-05 mem: 47% pow: 650.596 W 0: INFO 26-04-29 16:03:21.048077 - 0:28:01 - step: 16060 acc: 0 loss: 2.0061 grad: 1.53e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6218 data: 0.0899 lr: 5.05e-05 mem: 47% pow: 637.829 W 0: INFO 26-04-29 16:03:34.741505 - 0:28:15 - step: 16070 acc: 0 loss: 1.62 grad: 1.61e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6201 data: 0.0686 lr: 5.05e-05 mem: 47% pow: 661.741 W 0: INFO 26-04-29 16:03:48.757645 - 0:28:29 - step: 16080 acc: 0 loss: 1.0676 grad: 1.51e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.665 data: 0.0899 lr: 5.05e-05 mem: 47% pow: 613.441 W 0: INFO 26-04-29 16:04:02.704426 - 0:28:43 - step: 16090 acc: 0 loss: 1.3778 grad: 1.50e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5783 data: 0.1138 lr: 5.05e-05 mem: 47% pow: 658.769 W 0: INFO 26-04-29 16:04:16.714206 - 0:28:57 - step: 16100 acc: 0 loss: 1.7184 grad: 1.62e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6412 data: 0.0749 lr: 5.04e-05 mem: 47% pow: 637.247 W 0: INFO 26-04-29 16:04:33.705744 - 0:29:14 - step: 16110 acc: 0 loss: 1.476 grad: 1.49e-01 flops: 3.32e+14 wps: 3.86e+04 iter: 0.65 data: 0.0831 lr: 5.04e-05 mem: 54% pow: 632.944 W 0: INFO 26-04-29 16:04:47.468075 - 0:29:28 - step: 16120 acc: 0 loss: 1.6927 grad: 1.51e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5929 data: 0.104 lr: 5.04e-05 mem: 47% pow: 642.01 W 0: INFO 26-04-29 16:05:01.675618 - 0:29:42 - step: 16130 acc: 0 loss: 1.5211 grad: 1.50e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6178 data: 0.0935 lr: 5.04e-05 mem: 47% pow: 640.908 W 0: INFO 26-04-29 16:05:15.818759 - 0:29:56 - step: 16140 acc: 0 loss: 1.7467 grad: 1.58e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5958 data: 0.0908 lr: 5.04e-05 mem: 47% pow: 659.852 W 0: INFO 26-04-29 16:05:30.245841 - 0:30:11 - step: 16150 acc: 0 loss: 1.8004 grad: 1.55e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.887 data: 0.0824 lr: 5.04e-05 mem: 47% pow: 499.947 W 0: INFO 26-04-29 16:05:44.409184 - 0:30:25 - step: 16160 acc: 0 loss: 1.5798 grad: 1.62e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6016 data: 0.09 lr: 5.04e-05 mem: 47% pow: 657.634 W 0: INFO 26-04-29 16:05:58.211636 - 0:30:39 - step: 16170 acc: 0 loss: 1.7332 grad: 3.26e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.618 data: 0.0944 lr: 5.03e-05 mem: 47% pow: 646.887 W 0: INFO 26-04-29 16:06:12.419466 - 0:30:53 - step: 16180 acc: 0 loss: 1.8032 grad: 1.54e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6421 data: 0.0845 lr: 5.03e-05 mem: 47% pow: 638.499 W 0: INFO 26-04-29 16:06:26.006148 - 0:31:06 - step: 16190 acc: 0 loss: 1.5615 grad: 1.54e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5963 data: 0.1097 lr: 5.03e-05 mem: 47% pow: 660.775 W 0: INFO 26-04-29 16:06:40.018311 - 0:31:20 - step: 16200 acc: 0 loss: 1.67 grad: 1.70e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6118 data: 0.0835 lr: 5.03e-05 mem: 47% pow: 646.71 W 0: INFO 26-04-29 16:06:57.524850 - 0:31:38 - step: 16210 acc: 0 loss: 1.5291 grad: 1.65e-01 flops: 3.23e+14 wps: 3.74e+04 iter: 0.6082 data: 0.0832 lr: 5.03e-05 mem: 54% pow: 659.531 W 0: INFO 26-04-29 16:07:11.959686 - 0:31:52 - step: 16220 acc: 0 loss: 1.6022 grad: 1.50e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.5784 data: 0.3059 lr: 5.03e-05 mem: 47% pow: 546.079 W 0: INFO 26-04-29 16:07:25.913563 - 0:32:06 - step: 16230 acc: 0 loss: 1.7475 grad: 1.51e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6321 data: 0.0697 lr: 5.03e-05 mem: 47% pow: 658.932 W 0: INFO 26-04-29 16:07:40.229894 - 0:32:21 - step: 16240 acc: 0 loss: 2.0368 grad: 1.50e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.5755 data: 0.1149 lr: 5.02e-05 mem: 47% pow: 646.979 W 0: INFO 26-04-29 16:07:54.409115 - 0:32:35 - step: 16250 acc: 0 loss: 1.7282 grad: 1.67e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.577 data: 0.1182 lr: 5.02e-05 mem: 47% pow: 657.416 W 0: INFO 26-04-29 16:08:08.607467 - 0:32:49 - step: 16260 acc: 0 loss: 1.5818 grad: 1.55e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5959 data: 0.0881 lr: 5.02e-05 mem: 47% pow: 655.91 W 0: INFO 26-04-29 16:08:22.786954 - 0:33:03 - step: 16270 acc: 0 loss: 1.8252 grad: 1.53e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6572 data: 0.0923 lr: 5.02e-05 mem: 47% pow: 634.645 W 0: INFO 26-04-29 16:08:37.098461 - 0:33:17 - step: 16280 acc: 0 loss: 1.8322 grad: 1.57e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.8562 data: 0.0774 lr: 5.02e-05 mem: 47% pow: 518.115 W 0: INFO 26-04-29 16:08:51.012674 - 0:33:31 - step: 16290 acc: 0 loss: 1.5602 grad: 1.60e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5777 data: 0.0959 lr: 5.02e-05 mem: 47% pow: 655.637 W 0: INFO 26-04-29 16:09:05.177628 - 0:33:45 - step: 16300 acc: 0 loss: 1.7773 grad: 1.62e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.619 data: 0.0863 lr: 5.01e-05 mem: 47% pow: 645.597 W 0: INFO 26-04-29 16:09:21.917595 - 0:34:02 - step: 16310 acc: 0 loss: 1.7439 grad: 1.74e-01 flops: 3.37e+14 wps: 3.92e+04 iter: 0.6163 data: 0.0862 lr: 5.01e-05 mem: 54% pow: 645.752 W 0: INFO 26-04-29 16:09:35.743242 - 0:34:16 - step: 16320 acc: 0 loss: 1.5697 grad: 1.67e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6056 data: 0.0849 lr: 5.01e-05 mem: 47% pow: 656.755 W 0: INFO 26-04-29 16:09:49.773618 - 0:34:30 - step: 16330 acc: 0 loss: 1.8684 grad: 1.72e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6159 data: 0.0615 lr: 5.01e-05 mem: 47% pow: 671.61 W 0: INFO 26-04-29 16:10:03.986547 - 0:34:44 - step: 16340 acc: 0 loss: 1.8666 grad: 1.61e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.5955 data: 0.0974 lr: 5.01e-05 mem: 47% pow: 648.767 W 0: INFO 26-04-29 16:10:17.940100 - 0:34:58 - step: 16350 acc: 0 loss: 1.9307 grad: 1.55e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6179 data: 0.092 lr: 5.01e-05 mem: 47% pow: 656.907 W 0: INFO 26-04-29 16:10:32.052206 - 0:35:12 - step: 16360 acc: 0 loss: 1.7571 grad: 1.54e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6196 data: 0.0828 lr: 5.01e-05 mem: 47% pow: 648.443 W 0: INFO 26-04-29 16:10:46.028685 - 0:35:26 - step: 16370 acc: 0 loss: 1.8745 grad: 1.54e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6295 data: 0.0751 lr: 5.00e-05 mem: 47% pow: 650.2 W 0: INFO 26-04-29 16:10:59.970196 - 0:35:40 - step: 16380 acc: 0 loss: 1.6527 grad: 1.60e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6392 data: 0.0545 lr: 5.00e-05 mem: 47% pow: 654.878 W 0: INFO 26-04-29 16:11:13.981619 - 0:35:54 - step: 16390 acc: 0 loss: 1.472 grad: 1.57e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.58 data: 0.0913 lr: 5.00e-05 mem: 47% pow: 681.573 W 0: INFO 26-04-29 16:11:27.799287 - 0:36:08 - step: 16400 acc: 0 loss: 1.5599 grad: 1.51e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6456 data: 0.0968 lr: 5.00e-05 mem: 47% pow: 630.881 W 0: INFO 26-04-29 16:11:44.712672 - 0:36:25 - step: 16410 acc: 0 loss: 1.7112 grad: 1.62e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.7299 data: 0.0886 lr: 5.00e-05 mem: 54% pow: 577.562 W 0: INFO 26-04-29 16:11:58.795076 - 0:36:39 - step: 16420 acc: 0 loss: 1.5362 grad: 1.52e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5989 data: 0.0821 lr: 5.00e-05 mem: 47% pow: 663.54 W 0: INFO 26-04-29 16:12:12.611253 - 0:36:53 - step: 16430 acc: 0 loss: 1.4526 grad: 1.61e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6616 data: 0.0904 lr: 5.00e-05 mem: 47% pow: 619.551 W 0: INFO 26-04-29 16:12:26.819854 - 0:37:07 - step: 16440 acc: 0 loss: 1.8333 grad: 1.54e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.7642 data: 0.0874 lr: 4.99e-05 mem: 47% pow: 570.385 W 0: INFO 26-04-29 16:12:40.771469 - 0:37:21 - step: 16450 acc: 0 loss: 1.643 grad: 1.82e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6387 data: 0.0745 lr: 4.99e-05 mem: 47% pow: 638.635 W 0: INFO 26-04-29 16:12:54.744263 - 0:37:35 - step: 16460 acc: 0 loss: 1.432 grad: 1.88e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.605 data: 0.0819 lr: 4.99e-05 mem: 47% pow: 663.468 W 0: INFO 26-04-29 16:13:08.885522 - 0:37:49 - step: 16470 acc: 0 loss: 1.5351 grad: 1.76e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6007 data: 0.0906 lr: 4.99e-05 mem: 47% pow: 657.311 W 0: INFO 26-04-29 16:13:22.872927 - 0:38:03 - step: 16480 acc: 0 loss: 1.4334 grad: 1.67e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5969 data: 0.0829 lr: 4.99e-05 mem: 47% pow: 661.249 W 0: INFO 26-04-29 16:13:36.586027 - 0:38:17 - step: 16490 acc: 0 loss: 1.5629 grad: 1.73e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6051 data: 0.0858 lr: 4.99e-05 mem: 47% pow: 652.106 W 0: INFO 26-04-29 16:13:50.731020 - 0:38:31 - step: 16500 acc: 0 loss: 1.8844 grad: 1.56e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6715 data: 0.0037 lr: 4.98e-05 mem: 47% pow: 662.562 W 0: INFO 26-04-29 16:14:07.521883 - 0:38:48 - step: 16510 acc: 0 loss: 1.7798 grad: 1.48e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6188 data: 0.0888 lr: 4.98e-05 mem: 54% pow: 642.662 W 0: INFO 26-04-29 16:14:21.631015 - 0:39:02 - step: 16520 acc: 0 loss: 1.3718 grad: 1.53e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6442 data: 0.0868 lr: 4.98e-05 mem: 47% pow: 631.675 W 0: INFO 26-04-29 16:14:35.574119 - 0:39:16 - step: 16530 acc: 0 loss: 2.2895 grad: 1.68e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6012 data: 0.0911 lr: 4.98e-05 mem: 47% pow: 653.736 W 0: INFO 26-04-29 16:14:49.730116 - 0:39:30 - step: 16540 acc: 0 loss: 1.4851 grad: 1.57e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6021 data: 0.0913 lr: 4.98e-05 mem: 47% pow: 663.345 W 0: INFO 26-04-29 16:15:03.469319 - 0:39:44 - step: 16550 acc: 0 loss: 1.7773 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6194 data: 0.0846 lr: 4.98e-05 mem: 47% pow: 645.956 W 0: INFO 26-04-29 16:15:17.566924 - 0:39:58 - step: 16560 acc: 0 loss: 1.5515 grad: 1.60e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5876 data: 0.0945 lr: 4.98e-05 mem: 47% pow: 660.123 W 0: INFO 26-04-29 16:15:31.224370 - 0:40:12 - step: 16570 acc: 0 loss: 1.8628 grad: 1.59e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5991 data: 0.0908 lr: 4.97e-05 mem: 47% pow: 658.13 W 0: INFO 26-04-29 16:15:45.017878 - 0:40:25 - step: 16580 acc: 0 loss: 1.5658 grad: 1.52e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6195 data: 0.0781 lr: 4.97e-05 mem: 47% pow: 657.34 W 0: INFO 26-04-29 16:15:59.027611 - 0:40:39 - step: 16590 acc: 0 loss: 1.7607 grad: 1.62e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6276 data: 0.0851 lr: 4.97e-05 mem: 47% pow: 651.587 W 0: INFO 26-04-29 16:16:12.886018 - 0:40:53 - step: 16600 acc: 0 loss: 1.6273 grad: 1.49e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6029 data: 0.0881 lr: 4.97e-05 mem: 47% pow: 655.268 W 0: INFO 26-04-29 16:16:29.695910 - 0:41:10 - step: 16610 acc: 0 loss: 1.3228 grad: 1.52e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.8167 data: 0.0792 lr: 4.97e-05 mem: 54% pow: 542.58 W 0: INFO 26-04-29 16:16:43.477312 - 0:41:24 - step: 16620 acc: 0 loss: 1.4819 grad: 1.50e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5849 data: 0.1075 lr: 4.97e-05 mem: 47% pow: 653.808 W 0: INFO 26-04-29 16:16:57.135649 - 0:41:37 - step: 16630 acc: 0 loss: 1.9093 grad: 1.55e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6144 data: 0.0887 lr: 4.97e-05 mem: 47% pow: 658.733 W 0: INFO 26-04-29 16:17:10.910257 - 0:41:51 - step: 16640 acc: 0 loss: 1.2658 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5943 data: 0.0933 lr: 4.96e-05 mem: 47% pow: 669.614 W 0: INFO 26-04-29 16:17:24.878940 - 0:42:05 - step: 16650 acc: 0 loss: 1.4031 grad: 1.50e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.8108 data: 0.0865 lr: 4.96e-05 mem: 47% pow: 538.679 W 0: INFO 26-04-29 16:17:38.986491 - 0:42:19 - step: 16660 acc: 0 loss: 1.4969 grad: 1.73e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6053 data: 0.0858 lr: 4.96e-05 mem: 47% pow: 656.726 W 0: INFO 26-04-29 16:17:52.799508 - 0:42:33 - step: 16670 acc: 0 loss: 1.3866 grad: 1.58e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6046 data: 0.0942 lr: 4.96e-05 mem: 47% pow: 667.62 W 0: INFO 26-04-29 16:18:06.805824 - 0:42:47 - step: 16680 acc: 0 loss: 1.4539 grad: 1.53e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7052 data: 0.0875 lr: 4.96e-05 mem: 47% pow: 599.502 W 0: INFO 26-04-29 16:18:20.833432 - 0:43:01 - step: 16690 acc: 0 loss: 1.4011 grad: 1.63e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.5888 data: 0.0914 lr: 4.96e-05 mem: 47% pow: 665.107 W 0: INFO 26-04-29 16:18:34.555577 - 0:43:15 - step: 16700 acc: 0 loss: 1.1644 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.624 data: 0.0904 lr: 4.96e-05 mem: 47% pow: 645.349 W 0: INFO 26-04-29 16:18:51.469507 - 0:43:32 - step: 16710 acc: 0 loss: 1.4502 grad: 1.52e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.62 data: 0.0857 lr: 4.95e-05 mem: 54% pow: 643.923 W 0: INFO 26-04-29 16:19:05.485537 - 0:43:46 - step: 16720 acc: 0 loss: 1.4101 grad: 1.59e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5986 data: 0.0896 lr: 4.95e-05 mem: 47% pow: 656.487 W 0: INFO 26-04-29 16:19:19.616301 - 0:44:00 - step: 16730 acc: 0 loss: 1.6787 grad: 1.48e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6153 data: 0.0883 lr: 4.95e-05 mem: 47% pow: 645.712 W 0: INFO 26-04-29 16:19:33.206197 - 0:44:14 - step: 16740 acc: 0 loss: 1.7371 grad: 1.54e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6252 data: 0.0886 lr: 4.95e-05 mem: 47% pow: 641.413 W 0: INFO 26-04-29 16:19:46.986030 - 0:44:27 - step: 16750 acc: 0 loss: 1.4874 grad: 1.50e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6027 data: 0.1017 lr: 4.95e-05 mem: 47% pow: 648.871 W 0: INFO 26-04-29 16:20:01.037971 - 0:44:41 - step: 16760 acc: 0 loss: 1.6358 grad: 1.50e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6163 data: 0.1083 lr: 4.95e-05 mem: 47% pow: 629.075 W 0: INFO 26-04-29 16:20:14.777438 - 0:44:55 - step: 16770 acc: 0 loss: 1.6636 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5847 data: 0.0897 lr: 4.94e-05 mem: 47% pow: 662.11 W 0: INFO 26-04-29 16:20:28.385533 - 0:45:09 - step: 16780 acc: 0 loss: 1.5993 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6207 data: 0.0924 lr: 4.94e-05 mem: 47% pow: 644.043 W 0: INFO 26-04-29 16:20:42.383808 - 0:45:23 - step: 16790 acc: 0 loss: 1.5583 grad: 1.47e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.5989 data: 0.0863 lr: 4.94e-05 mem: 47% pow: 663.074 W 0: INFO 26-04-29 16:20:56.466742 - 0:45:37 - step: 16800 acc: 0 loss: 1.2764 grad: 1.58e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6078 data: 0.0902 lr: 4.94e-05 mem: 47% pow: 646.586 W 0: INFO 26-04-29 16:21:13.495848 - 0:45:54 - step: 16810 acc: 0 loss: 1.1056 grad: 1.51e-01 flops: 3.32e+14 wps: 3.85e+04 iter: 0.6446 data: 0.0983 lr: 4.94e-05 mem: 54% pow: 618.329 W 0: INFO 26-04-29 16:21:27.519439 - 0:46:08 - step: 16820 acc: 0 loss: 1.6373 grad: 1.48e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5817 data: 0.1179 lr: 4.94e-05 mem: 47% pow: 652.167 W 0: INFO 26-04-29 16:21:41.308912 - 0:46:22 - step: 16830 acc: 0 loss: 1.5669 grad: 1.58e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6633 data: 0.0925 lr: 4.94e-05 mem: 47% pow: 611.351 W 0: INFO 26-04-29 16:21:54.977260 - 0:46:35 - step: 16840 acc: 0 loss: 1.6549 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6059 data: 0.0796 lr: 4.93e-05 mem: 47% pow: 651.671 W 0: INFO 26-04-29 16:22:08.682638 - 0:46:49 - step: 16850 acc: 0 loss: 1.785 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5951 data: 0.0761 lr: 4.93e-05 mem: 47% pow: 662.747 W 0: INFO 26-04-29 16:22:22.780026 - 0:47:03 - step: 16860 acc: 0 loss: 1.5962 grad: 1.47e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6277 data: 0.0862 lr: 4.93e-05 mem: 47% pow: 595.466 W 0: INFO 26-04-29 16:22:36.611394 - 0:47:17 - step: 16870 acc: 0 loss: 1.4021 grad: 1.58e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5972 data: 0.0977 lr: 4.93e-05 mem: 47% pow: 652.522 W 0: INFO 26-04-29 16:22:50.478734 - 0:47:31 - step: 16880 acc: 0 loss: 1.5882 grad: 1.54e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6141 data: 0.053 lr: 4.93e-05 mem: 47% pow: 673.629 W 0: INFO 26-04-29 16:23:04.622540 - 0:47:45 - step: 16890 acc: 0 loss: 1.5298 grad: 1.66e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.7438 data: 0.0802 lr: 4.93e-05 mem: 47% pow: 583.124 W 0: INFO 26-04-29 16:23:18.864500 - 0:47:59 - step: 16900 acc: 0 loss: 1.7803 grad: 2.46e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.6097 data: 0.0825 lr: 4.93e-05 mem: 47% pow: 645.177 W 0: INFO 26-04-29 16:23:35.408013 - 0:48:16 - step: 16910 acc: 0 loss: 1.5013 grad: 1.58e-01 flops: 3.42e+14 wps: 3.96e+04 iter: 0.583 data: 0.1025 lr: 4.92e-05 mem: 54% pow: 666.001 W 0: INFO 26-04-29 16:23:49.277249 - 0:48:30 - step: 16920 acc: 0 loss: 1.2702 grad: 1.57e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6195 data: 0.0665 lr: 4.92e-05 mem: 47% pow: 659.438 W 0: INFO 26-04-29 16:24:02.957370 - 0:48:43 - step: 16930 acc: 0 loss: 1.4796 grad: 1.56e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6461 data: 0.0953 lr: 4.92e-05 mem: 47% pow: 630.577 W 0: INFO 26-04-29 16:24:16.937625 - 0:48:57 - step: 16940 acc: 0 loss: 1.5458 grad: 2.21e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5956 data: 0.0882 lr: 4.92e-05 mem: 47% pow: 669.283 W 0: INFO 26-04-29 16:24:30.692388 - 0:49:11 - step: 16950 acc: 0 loss: 1.4683 grad: 1.70e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5822 data: 0.0897 lr: 4.92e-05 mem: 47% pow: 655.171 W 0: INFO 26-04-29 16:24:44.555011 - 0:49:25 - step: 16960 acc: 0 loss: 1.8667 grad: 1.43e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6016 data: 0.0759 lr: 4.92e-05 mem: 47% pow: 661.594 W 0: INFO 26-04-29 16:24:58.946658 - 0:49:39 - step: 16970 acc: 0 loss: 1.5664 grad: 1.50e-01 flops: 3.92e+14 wps: 4.56e+04 iter: 0.608 data: 0.0843 lr: 4.92e-05 mem: 47% pow: 650.85 W 0: INFO 26-04-29 16:25:13.339332 - 0:49:54 - step: 16980 acc: 0 loss: 1.5609 grad: 1.51e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.5909 data: 0.0846 lr: 4.91e-05 mem: 47% pow: 679.273 W 0: INFO 26-04-29 16:25:27.277755 - 0:50:08 - step: 16990 acc: 0 loss: 1.5185 grad: 1.53e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6126 data: 0.0708 lr: 4.91e-05 mem: 47% pow: 656.624 W 0: INFO 26-04-29 16:25:41.565500 - 0:50:22 - step: 17000 acc: 0 loss: 1.2857 grad: 1.44e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.7033 data: 0.0867 lr: 4.91e-05 mem: 47% pow: 610.08 W 0: INFO 26-04-29 16:25:45.294125 - 0:50:26 - garbage collection 0: INFO 26-04-29 16:25:59.939673 - 0:50:40 - step: 17010 acc: 0 loss: 1.4277 grad: 1.50e-01 flops: 3.07e+14 wps: 3.57e+04 iter: 0.6182 data: 0.089 lr: 4.91e-05 mem: 54% pow: 647.448 W 0: INFO 26-04-29 16:26:13.913568 - 0:50:54 - step: 17020 acc: 0 loss: 1.3693 grad: 1.50e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6446 data: 0.0473 lr: 4.91e-05 mem: 47% pow: 658.238 W 0: INFO 26-04-29 16:26:27.721722 - 0:51:08 - step: 17030 acc: 0 loss: 1.6956 grad: 1.50e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.624 data: 0.0837 lr: 4.91e-05 mem: 47% pow: 642.775 W 0: INFO 26-04-29 16:26:41.749383 - 0:51:22 - step: 17040 acc: 0 loss: 1.6548 grad: 1.44e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.5985 data: 0.0939 lr: 4.90e-05 mem: 47% pow: 651.619 W 0: INFO 26-04-29 16:26:55.465354 - 0:51:36 - step: 17050 acc: 0 loss: 1.6671 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6293 data: 0.0952 lr: 4.90e-05 mem: 47% pow: 642.074 W 0: INFO 26-04-29 16:27:09.138231 - 0:51:49 - step: 17060 acc: 0 loss: 1.5244 grad: 1.69e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5896 data: 0.0862 lr: 4.90e-05 mem: 47% pow: 660.827 W 0: INFO 26-04-29 16:27:22.921632 - 0:52:03 - step: 17070 acc: 0 loss: 1.3193 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6358 data: 0.0743 lr: 4.90e-05 mem: 47% pow: 653.832 W 0: INFO 26-04-29 16:27:36.703794 - 0:52:17 - step: 17080 acc: 0 loss: 1.2096 grad: 1.49e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5949 data: 0.0937 lr: 4.90e-05 mem: 47% pow: 667.498 W 0: INFO 26-04-29 16:27:50.743103 - 0:52:31 - step: 17090 acc: 0 loss: 1.4015 grad: 1.80e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.7012 data: 0.0878 lr: 4.90e-05 mem: 47% pow: 604.439 W 0: INFO 26-04-29 16:28:04.317566 - 0:52:45 - step: 17100 acc: 0 loss: 1.6615 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6178 data: 0.0888 lr: 4.90e-05 mem: 47% pow: 651.809 W 0: INFO 26-04-29 16:28:21.260922 - 0:53:02 - step: 17110 acc: 0 loss: 1.5839 grad: 1.43e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.8347 data: 0.0873 lr: 4.89e-05 mem: 54% pow: 533.234 W 0: INFO 26-04-29 16:28:34.963409 - 0:53:15 - step: 17120 acc: 0 loss: 1.6762 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5832 data: 0.0896 lr: 4.89e-05 mem: 47% pow: 665.145 W 0: INFO 26-04-29 16:28:48.653270 - 0:53:29 - step: 17130 acc: 0 loss: 1.572 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5806 data: 0.1014 lr: 4.89e-05 mem: 47% pow: 657.953 W 0: INFO 26-04-29 16:29:02.745270 - 0:53:43 - step: 17140 acc: 0 loss: 1.1798 grad: 1.69e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.8297 data: 0.0034 lr: 4.89e-05 mem: 47% pow: 574.878 W 0: INFO 26-04-29 16:29:16.328426 - 0:53:57 - step: 17150 acc: 0 loss: 1.6648 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5839 data: 0.086 lr: 4.89e-05 mem: 47% pow: 675.753 W 0: INFO 26-04-29 16:29:30.437309 - 0:54:11 - step: 17160 acc: 0 loss: 1.3128 grad: 1.42e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.616 data: 0.0821 lr: 4.89e-05 mem: 47% pow: 653.505 W 0: INFO 26-04-29 16:29:44.034549 - 0:54:24 - step: 17170 acc: 0 loss: 1.503 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5865 data: 0.0896 lr: 4.89e-05 mem: 47% pow: 671.504 W 0: INFO 26-04-29 16:29:57.796873 - 0:54:38 - step: 17180 acc: 0 loss: 1.2333 grad: 1.67e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.6118 data: 0.0897 lr: 4.88e-05 mem: 47% pow: 646.935 W 0: INFO 26-04-29 16:30:11.562376 - 0:54:52 - step: 17190 acc: 0 loss: 1.2369 grad: 1.57e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6426 data: 0.1054 lr: 4.88e-05 mem: 47% pow: 622.311 W 0: INFO 26-04-29 16:30:25.568883 - 0:55:06 - step: 17200 acc: 0 loss: 1.2235 grad: 1.46e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6036 data: 0.0866 lr: 4.88e-05 mem: 47% pow: 655.992 W 0: INFO 26-04-29 16:30:42.543756 - 0:55:23 - step: 17210 acc: 0 loss: 1.1783 grad: 1.57e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 0.5785 data: 0.1119 lr: 4.88e-05 mem: 54% pow: 664.341 W 0: INFO 26-04-29 16:30:56.416819 - 0:55:37 - step: 17220 acc: 0 loss: 1.4205 grad: 1.53e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5965 data: 0.0867 lr: 4.88e-05 mem: 47% pow: 658.772 W 0: INFO 26-04-29 16:31:10.049806 - 0:55:50 - step: 17230 acc: 0 loss: 1.3563 grad: 1.45e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6072 data: 0.0801 lr: 4.88e-05 mem: 47% pow: 667.213 W 0: INFO 26-04-29 16:31:24.046681 - 0:56:04 - step: 17240 acc: 0 loss: 1.3275 grad: 1.54e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6097 data: 0.0864 lr: 4.87e-05 mem: 47% pow: 649.699 W 0: INFO 26-04-29 16:31:38.304507 - 0:56:19 - step: 17250 acc: 0 loss: 1.3535 grad: 1.60e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 1.0609 data: 0.0716 lr: 4.87e-05 mem: 47% pow: 411.78 W 0: INFO 26-04-29 16:31:52.197736 - 0:56:32 - step: 17260 acc: 0 loss: 1.4113 grad: 1.52e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5996 data: 0.079 lr: 4.87e-05 mem: 47% pow: 665.462 W 0: INFO 26-04-29 16:32:06.159723 - 0:56:46 - step: 17270 acc: 0 loss: 1.273 grad: 1.54e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.596 data: 0.0913 lr: 4.87e-05 mem: 47% pow: 658.865 W 0: INFO 26-04-29 16:32:20.014646 - 0:57:00 - step: 17280 acc: 0 loss: 1.7009 grad: 1.55e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6226 data: 0.0926 lr: 4.87e-05 mem: 47% pow: 639.22 W 0: INFO 26-04-29 16:32:34.008008 - 0:57:14 - step: 17290 acc: 0 loss: 1.2611 grad: 1.44e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6669 data: 0.0848 lr: 4.87e-05 mem: 47% pow: 616.149 W 0: INFO 26-04-29 16:32:47.910441 - 0:57:28 - step: 17300 acc: 0 loss: 1.5426 grad: 1.51e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.629 data: 0.0808 lr: 4.87e-05 mem: 47% pow: 644.74 W 0: INFO 26-04-29 16:33:04.663661 - 0:57:45 - step: 17310 acc: 0 loss: 1.4212 grad: 1.41e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.5768 data: 0.0937 lr: 4.86e-05 mem: 54% pow: 666.398 W 0: INFO 26-04-29 16:33:18.351850 - 0:57:59 - step: 17320 acc: 0 loss: 1.7196 grad: 1.43e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6711 data: 0.0845 lr: 4.86e-05 mem: 47% pow: 626.12 W 0: INFO 26-04-29 16:33:32.028342 - 0:58:12 - step: 17330 acc: 0 loss: 1.2715 grad: 1.47e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6408 data: 0.0619 lr: 4.86e-05 mem: 47% pow: 659.781 W 0: INFO 26-04-29 16:33:46.146265 - 0:58:26 - step: 17340 acc: 0 loss: 1.3954 grad: 1.59e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6267 data: 0.0897 lr: 4.86e-05 mem: 47% pow: 645.1 W 0: INFO 26-04-29 16:33:59.749774 - 0:58:40 - step: 17350 acc: 0 loss: 1.2445 grad: 1.62e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6085 data: 0.0857 lr: 4.86e-05 mem: 47% pow: 656.977 W 0: INFO 26-04-29 16:34:14.135412 - 0:58:54 - step: 17360 acc: 0 loss: 1.3859 grad: 1.51e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6614 data: 0.0817 lr: 4.86e-05 mem: 47% pow: 630.915 W 0: INFO 26-04-29 16:34:28.457239 - 0:59:09 - step: 17370 acc: 0 loss: 1.4926 grad: 1.52e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.6777 data: 0.0855 lr: 4.86e-05 mem: 47% pow: 609.082 W 0: INFO 26-04-29 16:34:42.095141 - 0:59:22 - step: 17380 acc: 0 loss: 1.1736 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6085 data: 0.0871 lr: 4.85e-05 mem: 47% pow: 651.586 W 0: INFO 26-04-29 16:34:55.867067 - 0:59:36 - step: 17390 acc: 0 loss: 1.8166 grad: 1.53e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6647 data: 0.0669 lr: 4.85e-05 mem: 47% pow: 629.728 W 0: INFO 26-04-29 16:35:09.718081 - 0:59:50 - step: 17400 acc: 0 loss: 1.3528 grad: 1.51e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.636 data: 0.0862 lr: 4.85e-05 mem: 47% pow: 634.801 W 0: INFO 26-04-29 16:35:26.554301 - 1:00:07 - step: 17410 acc: 0 loss: 1.6756 grad: 1.75e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6076 data: 0.0826 lr: 4.85e-05 mem: 54% pow: 656.045 W 0: INFO 26-04-29 16:35:40.454150 - 1:00:21 - step: 17420 acc: 0 loss: 1.0651 grad: 1.92e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.5958 data: 0.0814 lr: 4.85e-05 mem: 47% pow: 663.011 W 0: INFO 26-04-29 16:35:54.652655 - 1:00:35 - step: 17430 acc: 0 loss: 1.7374 grad: 1.78e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.7385 data: 0.0602 lr: 4.85e-05 mem: 47% pow: 594.849 W 0: INFO 26-04-29 16:36:08.703016 - 1:00:49 - step: 17440 acc: 0 loss: 1.5997 grad: 1.57e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6762 data: 0.0671 lr: 4.85e-05 mem: 47% pow: 632.033 W 0: INFO 26-04-29 16:36:22.626270 - 1:01:03 - step: 17450 acc: 0 loss: 1.2149 grad: 1.48e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6046 data: 0.09 lr: 4.84e-05 mem: 47% pow: 649.315 W 0: INFO 26-04-29 16:36:36.509359 - 1:01:17 - step: 17460 acc: 0 loss: 1.5452 grad: 1.56e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6515 data: 0.0242 lr: 4.84e-05 mem: 47% pow: 658.095 W 0: INFO 26-04-29 16:36:50.222299 - 1:01:31 - step: 17470 acc: 0 loss: 1.5485 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.597 data: 0.0863 lr: 4.84e-05 mem: 47% pow: 653.764 W 0: INFO 26-04-29 16:37:04.096720 - 1:01:44 - step: 17480 acc: 0 loss: 1.2044 grad: 1.81e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6059 data: 0.0862 lr: 4.84e-05 mem: 47% pow: 654.925 W 0: INFO 26-04-29 16:37:17.877563 - 1:01:58 - step: 17490 acc: 0 loss: 1.5346 grad: 1.70e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6022 data: 0.0835 lr: 4.84e-05 mem: 47% pow: 659.808 W 0: INFO 26-04-29 16:37:31.933929 - 1:02:12 - step: 17500 acc: 0 loss: 1.1019 grad: 1.57e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6326 data: 0.0863 lr: 4.84e-05 mem: 47% pow: 635.219 W 0: INFO 26-04-29 16:37:48.422545 - 1:02:29 - step: 17510 acc: 0 loss: 1.0585 grad: 1.54e-01 flops: 3.42e+14 wps: 3.98e+04 iter: 0.6197 data: 0.0892 lr: 4.83e-05 mem: 54% pow: 648.452 W 0: INFO 26-04-29 16:38:02.438472 - 1:02:43 - step: 17520 acc: 0 loss: 1.7137 grad: 1.58e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6977 data: 0.0896 lr: 4.83e-05 mem: 47% pow: 606.61 W 0: INFO 26-04-29 16:38:16.395499 - 1:02:57 - step: 17530 acc: 0 loss: 1.2785 grad: 1.50e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6796 data: 0.0843 lr: 4.83e-05 mem: 47% pow: 613.758 W 0: INFO 26-04-29 16:38:30.395293 - 1:03:11 - step: 17540 acc: 0 loss: 1.1237 grad: 1.54e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6015 data: 0.0827 lr: 4.83e-05 mem: 47% pow: 658.858 W 0: INFO 26-04-29 16:38:44.549479 - 1:03:25 - step: 17550 acc: 0 loss: 1.4403 grad: 1.59e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5986 data: 0.0863 lr: 4.83e-05 mem: 47% pow: 662.904 W 0: INFO 26-04-29 16:38:58.389741 - 1:03:39 - step: 17560 acc: 0 loss: 1.5812 grad: 3.04e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5991 data: 0.0923 lr: 4.83e-05 mem: 47% pow: 650.026 W 0: INFO 26-04-29 16:39:12.241674 - 1:03:53 - step: 17570 acc: 0 loss: 1.3177 grad: 1.58e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6063 data: 0.0948 lr: 4.83e-05 mem: 47% pow: 653.155 W 0: INFO 26-04-29 16:39:25.868149 - 1:04:06 - step: 17580 acc: 0 loss: 1.5146 grad: 1.79e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5908 data: 0.0838 lr: 4.82e-05 mem: 47% pow: 656.935 W 0: INFO 26-04-29 16:39:39.538325 - 1:04:20 - step: 17590 acc: 0 loss: 1.1467 grad: 1.48e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6145 data: 0.0889 lr: 4.82e-05 mem: 47% pow: 655.565 W 0: INFO 26-04-29 16:39:53.346052 - 1:04:34 - step: 17600 acc: 0 loss: 1.2618 grad: 1.58e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6006 data: 0.0905 lr: 4.82e-05 mem: 47% pow: 660.645 W 0: INFO 26-04-29 16:40:10.329579 - 1:04:51 - step: 17610 acc: 0 loss: 1.3676 grad: 1.51e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 0.6131 data: 0.08 lr: 4.82e-05 mem: 54% pow: 659.515 W 0: INFO 26-04-29 16:40:24.081577 - 1:05:04 - step: 17620 acc: 0 loss: 1.3613 grad: 1.50e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.591 data: 0.0933 lr: 4.82e-05 mem: 47% pow: 662.234 W 0: INFO 26-04-29 16:40:37.853787 - 1:05:18 - step: 17630 acc: 0 loss: 1.5662 grad: 1.58e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6147 data: 0.0897 lr: 4.82e-05 mem: 47% pow: 658.683 W 0: INFO 26-04-29 16:40:51.985382 - 1:05:32 - step: 17640 acc: 0 loss: 1.1573 grad: 1.53e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.7494 data: 0.0814 lr: 4.82e-05 mem: 47% pow: 579.821 W 0: INFO 26-04-29 16:41:06.177879 - 1:05:46 - step: 17650 acc: 0 loss: 1.7754 grad: 1.68e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6009 data: 0.0946 lr: 4.81e-05 mem: 47% pow: 655.374 W 0: INFO 26-04-29 16:41:19.844810 - 1:06:00 - step: 17660 acc: 0 loss: 1.5277 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5819 data: 0.1028 lr: 4.81e-05 mem: 47% pow: 673.451 W 0: INFO 26-04-29 16:41:33.811709 - 1:06:14 - step: 17670 acc: 0 loss: 0.9616 grad: 1.66e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6235 data: 0.0583 lr: 4.81e-05 mem: 47% pow: 660.568 W 0: INFO 26-04-29 16:41:47.854188 - 1:06:28 - step: 17680 acc: 0 loss: 1.4052 grad: 1.47e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6033 data: 0.0751 lr: 4.81e-05 mem: 47% pow: 662.653 W 0: INFO 26-04-29 16:42:01.852898 - 1:06:42 - step: 17690 acc: 0 loss: 1.4841 grad: 1.59e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6076 data: 0.0861 lr: 4.81e-05 mem: 47% pow: 646.163 W 0: INFO 26-04-29 16:42:15.943387 - 1:06:56 - step: 17700 acc: 0 loss: 1.7475 grad: 1.72e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.7681 data: 0.0825 lr: 4.81e-05 mem: 47% pow: 572.427 W 0: INFO 26-04-29 16:42:32.728182 - 1:07:13 - step: 17710 acc: 0 loss: 1.093 grad: 1.59e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6047 data: 0.0775 lr: 4.80e-05 mem: 54% pow: 662.154 W 0: INFO 26-04-29 16:42:46.681856 - 1:07:27 - step: 17720 acc: 0 loss: 1.5323 grad: 1.54e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6371 data: 0.0878 lr: 4.80e-05 mem: 47% pow: 633.211 W 0: INFO 26-04-29 16:43:00.628718 - 1:07:41 - step: 17730 acc: 0 loss: 1.4517 grad: 1.50e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5923 data: 0.0938 lr: 4.80e-05 mem: 47% pow: 655.946 W 0: INFO 26-04-29 16:43:14.548761 - 1:07:55 - step: 17740 acc: 0 loss: 1.5527 grad: 1.54e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.5837 data: 0.0903 lr: 4.80e-05 mem: 47% pow: 663.245 W 0: INFO 26-04-29 16:43:28.146190 - 1:08:08 - step: 17750 acc: 0 loss: 1.3345 grad: 1.59e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6466 data: 0.0853 lr: 4.80e-05 mem: 47% pow: 626.806 W 0: INFO 26-04-29 16:43:42.270648 - 1:08:23 - step: 17760 acc: 0 loss: 1.525 grad: 1.42e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6917 data: 0.0032 lr: 4.80e-05 mem: 47% pow: 656.729 W 0: INFO 26-04-29 16:43:56.246938 - 1:08:37 - step: 17770 acc: 0 loss: 1.1805 grad: 1.50e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6423 data: 0.0697 lr: 4.80e-05 mem: 47% pow: 636.783 W 0: INFO 26-04-29 16:44:09.895059 - 1:08:50 - step: 17780 acc: 0 loss: 1.3584 grad: 1.89e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5952 data: 0.0854 lr: 4.79e-05 mem: 47% pow: 664.78 W 0: INFO 26-04-29 16:44:24.164474 - 1:09:04 - step: 17790 acc: 0 loss: 1.6761 grad: 1.54e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6037 data: 0.0821 lr: 4.79e-05 mem: 47% pow: 664.375 W 0: INFO 26-04-29 16:44:37.995109 - 1:09:18 - step: 17800 acc: 0 loss: 1.3524 grad: 1.55e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5925 data: 0.0899 lr: 4.79e-05 mem: 47% pow: 659.597 W 0: INFO 26-04-29 16:44:54.608063 - 1:09:35 - step: 17810 acc: 0 loss: 1.5973 grad: 1.54e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6046 data: 0.0917 lr: 4.79e-05 mem: 54% pow: 650.661 W 0: INFO 26-04-29 16:45:08.417016 - 1:09:49 - step: 17820 acc: 0 loss: 1.3797 grad: 1.54e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6161 data: 0.0826 lr: 4.79e-05 mem: 47% pow: 648.051 W 0: INFO 26-04-29 16:45:21.966898 - 1:10:02 - step: 17830 acc: 0 loss: 1.2981 grad: 1.46e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5966 data: 0.0861 lr: 4.79e-05 mem: 47% pow: 661.101 W 0: INFO 26-04-29 16:45:35.985755 - 1:10:16 - step: 17840 acc: 0 loss: 1.6538 grad: 1.64e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6052 data: 0.0854 lr: 4.79e-05 mem: 47% pow: 645.339 W 0: INFO 26-04-29 16:45:49.672898 - 1:10:30 - step: 17850 acc: 0 loss: 1.4688 grad: 1.51e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.616 data: 0.0849 lr: 4.78e-05 mem: 47% pow: 648.811 W 0: INFO 26-04-29 16:46:03.469206 - 1:10:44 - step: 17860 acc: 0 loss: 1.5764 grad: 1.51e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5804 data: 0.1313 lr: 4.78e-05 mem: 47% pow: 643.469 W 0: INFO 26-04-29 16:46:17.164585 - 1:10:57 - step: 17870 acc: 0 loss: 1.1228 grad: 1.47e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6084 data: 0.0828 lr: 4.78e-05 mem: 47% pow: 659.941 W 0: INFO 26-04-29 16:46:31.092886 - 1:11:11 - step: 17880 acc: 0 loss: 1.378 grad: 1.47e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5887 data: 0.0877 lr: 4.78e-05 mem: 47% pow: 662.552 W 0: INFO 26-04-29 16:46:45.487894 - 1:11:26 - step: 17890 acc: 0 loss: 1.493 grad: 1.52e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.8684 data: 0.0892 lr: 4.78e-05 mem: 47% pow: 499.475 W 0: INFO 26-04-29 16:46:59.355710 - 1:11:40 - step: 17900 acc: 0 loss: 1.5761 grad: 1.53e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5853 data: 0.0855 lr: 4.78e-05 mem: 47% pow: 671.723 W 0: INFO 26-04-29 16:47:19.984863 - 1:12:00 - step: 17910 acc: 0 loss: 1.6107 grad: 1.51e-01 flops: 2.74e+14 wps: 3.18e+04 iter: 4.7397 data: 0.0918 lr: 4.78e-05 mem: 54% pow: 424.037 W 0: INFO 26-04-29 16:47:33.769238 - 1:12:14 - step: 17920 acc: 0 loss: 1.2602 grad: 1.53e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5809 data: 0.0923 lr: 4.77e-05 mem: 47% pow: 663.269 W 0: INFO 26-04-29 16:47:48.089140 - 1:12:28 - step: 17930 acc: 0 loss: 1.5272 grad: 1.63e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.589 data: 0.0882 lr: 4.77e-05 mem: 47% pow: 660.733 W 0: INFO 26-04-29 16:48:01.869016 - 1:12:42 - step: 17940 acc: 0 loss: 1.48 grad: 1.51e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5847 data: 0.085 lr: 4.77e-05 mem: 47% pow: 673.463 W 0: INFO 26-04-29 16:48:15.728415 - 1:12:56 - step: 17950 acc: 0 loss: 1.7366 grad: 1.51e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6073 data: 0.0819 lr: 4.77e-05 mem: 47% pow: 653.416 W 0: INFO 26-04-29 16:48:29.383593 - 1:13:10 - step: 17960 acc: 0 loss: 1.2263 grad: 1.54e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6049 data: 0.0803 lr: 4.77e-05 mem: 47% pow: 658.6 W 0: INFO 26-04-29 16:48:43.404178 - 1:13:24 - step: 17970 acc: 0 loss: 1.6388 grad: 1.48e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.7176 data: 0.0883 lr: 4.77e-05 mem: 47% pow: 589.008 W 0: INFO 26-04-29 16:48:58.727416 - 1:13:39 - step: 17980 acc: 0 loss: 1.3581 grad: 1.49e-01 flops: 3.69e+14 wps: 4.28e+04 iter: 0.6351 data: 0.079 lr: 4.76e-05 mem: 47% pow: 644.715 W 0: INFO 26-04-29 16:49:13.237510 - 1:13:54 - step: 17990 acc: 0 loss: 1.2134 grad: 1.47e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.6214 data: 0.0797 lr: 4.76e-05 mem: 47% pow: 658.585 W 0: INFO 26-04-29 16:49:27.056221 - 1:14:07 - step: 18000 acc: 0 loss: 1.3843 grad: 1.73e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5901 data: 0.0937 lr: 4.76e-05 mem: 47% pow: 660.226 W 0: INFO 26-04-29 16:49:30.708856 - 1:14:11 - garbage collection 0: INFO 26-04-29 16:49:45.354189 - 1:14:26 - step: 18010 acc: 0 loss: 1.4056 grad: 1.49e-01 flops: 3.09e+14 wps: 3.58e+04 iter: 0.593 data: 0.1273 lr: 4.76e-05 mem: 54% pow: 635.281 W 0: INFO 26-04-29 16:49:59.205074 - 1:14:40 - step: 18020 acc: 0 loss: 1.4183 grad: 1.57e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.653 data: 0.0712 lr: 4.76e-05 mem: 47% pow: 653.055 W 0: INFO 26-04-29 16:50:13.191903 - 1:14:53 - step: 18030 acc: 0 loss: 1.052 grad: 1.51e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.9189 data: 0.0728 lr: 4.76e-05 mem: 47% pow: 489.182 W 0: INFO 26-04-29 16:50:26.941325 - 1:15:07 - step: 18040 acc: 0 loss: 1.5431 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5993 data: 0.0859 lr: 4.76e-05 mem: 47% pow: 655.22 W 0: INFO 26-04-29 16:50:41.011109 - 1:15:21 - step: 18050 acc: 0 loss: 1.181 grad: 1.55e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.668 data: 0.0032 lr: 4.75e-05 mem: 47% pow: 671.533 W 0: INFO 26-04-29 16:50:55.808220 - 1:15:36 - step: 18060 acc: 0 loss: 1.3902 grad: 1.71e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.6091 data: 0.0803 lr: 4.75e-05 mem: 47% pow: 658.86 W 0: INFO 26-04-29 16:51:09.688593 - 1:15:50 - step: 18070 acc: 0 loss: 1.8167 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6127 data: 0.0825 lr: 4.75e-05 mem: 47% pow: 654.004 W 0: INFO 26-04-29 16:51:24.165668 - 1:16:04 - step: 18080 acc: 0 loss: 1.6309 grad: 1.62e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.5967 data: 0.079 lr: 4.75e-05 mem: 47% pow: 690.128 W 0: INFO 26-04-29 16:51:39.642087 - 1:16:20 - step: 18090 acc: 0 loss: 1.9603 grad: 1.57e-01 flops: 3.65e+14 wps: 4.24e+04 iter: 0.7679 data: 0.0427 lr: 4.75e-05 mem: 47% pow: 589.542 W 0: INFO 26-04-29 16:51:54.164959 - 1:16:34 - step: 18100 acc: 0 loss: 1.4621 grad: 1.54e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 1.2285 data: 0.1002 lr: 4.75e-05 mem: 47% pow: 426.551 W 0: INFO 26-04-29 16:52:10.882949 - 1:16:51 - step: 18110 acc: 0 loss: 1.4429 grad: 1.48e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.6133 data: 0.0983 lr: 4.75e-05 mem: 54% pow: 640.274 W 0: INFO 26-04-29 16:52:25.268738 - 1:17:06 - step: 18120 acc: 0 loss: 1.5054 grad: 1.47e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6346 data: 0.0758 lr: 4.74e-05 mem: 47% pow: 642.828 W 0: INFO 26-04-29 16:52:39.074246 - 1:17:19 - step: 18130 acc: 0 loss: 1.7928 grad: 1.56e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6027 data: 0.091 lr: 4.74e-05 mem: 47% pow: 653.901 W 0: INFO 26-04-29 16:52:54.122709 - 1:17:34 - step: 18140 acc: 0 loss: 1.2916 grad: 1.46e-01 flops: 3.75e+14 wps: 4.36e+04 iter: 0.6146 data: 0.089 lr: 4.74e-05 mem: 47% pow: 650.631 W 0: INFO 26-04-29 16:53:07.997816 - 1:17:48 - step: 18150 acc: 0 loss: 1.2891 grad: 1.53e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6301 data: 0.0762 lr: 4.74e-05 mem: 47% pow: 651.129 W 0: INFO 26-04-29 16:53:21.838690 - 1:18:02 - step: 18160 acc: 0 loss: 1.1644 grad: 1.50e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7381 data: 0.0845 lr: 4.74e-05 mem: 47% pow: 583.843 W 0: INFO 26-04-29 16:53:42.585106 - 1:18:23 - step: 18170 acc: 0 loss: 1.4925 grad: 1.56e-01 flops: 2.72e+14 wps: 3.16e+04 iter: 0.5902 data: 0.0921 lr: 4.74e-05 mem: 47% pow: 656.816 W 0: INFO 26-04-29 16:53:56.471197 - 1:18:37 - step: 18180 acc: 0 loss: 1.5561 grad: 1.41e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5945 data: 0.0972 lr: 4.73e-05 mem: 47% pow: 654.192 W 0: INFO 26-04-29 16:54:11.063619 - 1:18:51 - step: 18190 acc: 0 loss: 1.4037 grad: 1.48e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.5992 data: 0.0722 lr: 4.73e-05 mem: 47% pow: 659.977 W 0: INFO 26-04-29 16:54:25.706691 - 1:19:06 - step: 18200 acc: 0 loss: 1.3222 grad: 1.50e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.6217 data: 0.0777 lr: 4.73e-05 mem: 47% pow: 641.402 W 0: INFO 26-04-29 16:54:42.611863 - 1:19:23 - step: 18210 acc: 0 loss: 1.4097 grad: 1.50e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6632 data: 0.0858 lr: 4.73e-05 mem: 54% pow: 633.805 W 0: INFO 26-04-29 16:54:56.232784 - 1:19:37 - step: 18220 acc: 0 loss: 1.6423 grad: 1.45e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5892 data: 0.0805 lr: 4.73e-05 mem: 47% pow: 666.917 W 0: INFO 26-04-29 16:55:10.668977 - 1:19:51 - step: 18230 acc: 0 loss: 1.5678 grad: 1.62e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6339 data: 0.0803 lr: 4.73e-05 mem: 47% pow: 646.851 W 0: INFO 26-04-29 16:55:27.675485 - 1:20:08 - step: 18240 acc: 0 loss: 1.6024 grad: 1.45e-01 flops: 3.32e+14 wps: 3.85e+04 iter: 0.5915 data: 0.0791 lr: 4.73e-05 mem: 47% pow: 664.034 W 0: INFO 26-04-29 16:55:47.601458 - 1:20:28 - step: 18250 acc: 0 loss: 1.3959 grad: 1.50e-01 flops: 2.85e+14 wps: 3.30e+04 iter: 0.5874 data: 0.0843 lr: 4.72e-05 mem: 47% pow: 661.382 W 0: INFO 26-04-29 16:56:01.557571 - 1:20:42 - step: 18260 acc: 0 loss: 1.4644 grad: 1.59e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5991 data: 0.0778 lr: 4.72e-05 mem: 47% pow: 664.028 W 0: INFO 26-04-29 16:56:15.598291 - 1:20:56 - step: 18270 acc: 0 loss: 1.1919 grad: 1.57e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.5844 data: 0.1202 lr: 4.72e-05 mem: 47% pow: 654.182 W 0: INFO 26-04-29 16:56:30.047314 - 1:21:10 - step: 18280 acc: 0 loss: 1.3418 grad: 1.59e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6058 data: 0.0844 lr: 4.72e-05 mem: 47% pow: 667.152 W 0: INFO 26-04-29 16:56:44.309870 - 1:21:25 - step: 18290 acc: 0 loss: 1.5167 grad: 1.47e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6098 data: 0.0861 lr: 4.72e-05 mem: 47% pow: 649.534 W 0: INFO 26-04-29 16:56:58.040724 - 1:21:38 - step: 18300 acc: 0 loss: 1.4457 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5824 data: 0.0868 lr: 4.72e-05 mem: 47% pow: 671.029 W 0: INFO 26-04-29 16:57:14.988135 - 1:21:55 - step: 18310 acc: 0 loss: 1.1168 grad: 1.49e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.6416 data: 0.0865 lr: 4.72e-05 mem: 54% pow: 632.107 W 0: INFO 26-04-29 16:57:37.617824 - 1:22:18 - step: 18320 acc: 0 loss: 1.5948 grad: 1.51e-01 flops: 2.50e+14 wps: 2.90e+04 iter: 0.6358 data: 0.0828 lr: 4.71e-05 mem: 47% pow: 643.926 W 0: INFO 26-04-29 16:57:52.596401 - 1:22:33 - step: 18330 acc: 0 loss: 1.2242 grad: 1.44e-01 flops: 3.77e+14 wps: 4.38e+04 iter: 0.5894 data: 0.0869 lr: 4.71e-05 mem: 47% pow: 660.514 W 0: INFO 26-04-29 16:58:08.194504 - 1:22:48 - step: 18340 acc: 0 loss: 1.4416 grad: 1.55e-01 flops: 3.62e+14 wps: 4.20e+04 iter: 0.6019 data: 0.0857 lr: 4.71e-05 mem: 47% pow: 658.432 W 0: INFO 26-04-29 16:58:22.154515 - 1:23:02 - step: 18350 acc: 0 loss: 1.5045 grad: 1.55e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6261 data: 0.094 lr: 4.71e-05 mem: 47% pow: 634.249 W 0: INFO 26-04-29 16:58:36.206808 - 1:23:17 - step: 18360 acc: 0 loss: 1.2458 grad: 1.56e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.706 data: 0.0776 lr: 4.71e-05 mem: 47% pow: 600.053 W 0: INFO 26-04-29 16:58:50.776977 - 1:23:31 - step: 18370 acc: 0 loss: 1.2571 grad: 1.55e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6076 data: 0.0895 lr: 4.71e-05 mem: 47% pow: 649.984 W 0: INFO 26-04-29 16:59:04.899543 - 1:23:45 - step: 18380 acc: 0 loss: 1.4389 grad: 1.44e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5938 data: 0.0919 lr: 4.71e-05 mem: 47% pow: 659.558 W 0: INFO 26-04-29 16:59:21.071222 - 1:24:01 - step: 18390 acc: 0 loss: 1.2404 grad: 1.48e-01 flops: 3.49e+14 wps: 4.05e+04 iter: 0.6693 data: 0.0806 lr: 4.70e-05 mem: 47% pow: 621.577 W 0: INFO 26-04-29 16:59:34.927519 - 1:24:15 - step: 18400 acc: 0 loss: 1.3099 grad: 1.46e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6983 data: 0.0349 lr: 4.70e-05 mem: 47% pow: 626.696 W 0: INFO 26-04-29 16:59:52.013186 - 1:24:32 - step: 18410 acc: 0 loss: 1.7328 grad: 1.65e-01 flops: 3.31e+14 wps: 3.84e+04 iter: 0.6299 data: 0.0862 lr: 4.70e-05 mem: 54% pow: 639.226 W 0: INFO 26-04-29 17:00:06.388519 - 1:24:47 - step: 18420 acc: 0 loss: 1.527 grad: 1.55e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6274 data: 0.0681 lr: 4.70e-05 mem: 47% pow: 652.128 W 0: INFO 26-04-29 17:00:20.389312 - 1:25:01 - step: 18430 acc: 0 loss: 1.978 grad: 1.54e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6123 data: 0.0942 lr: 4.70e-05 mem: 47% pow: 646.901 W 0: INFO 26-04-29 17:00:34.963080 - 1:25:15 - step: 18440 acc: 0 loss: 1.4188 grad: 1.64e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.5936 data: 0.0772 lr: 4.70e-05 mem: 47% pow: 668.321 W 0: INFO 26-04-29 17:00:48.955646 - 1:25:29 - step: 18450 acc: 0 loss: 1.5519 grad: 1.49e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7682 data: 0.0839 lr: 4.69e-05 mem: 47% pow: 567.099 W 0: INFO 26-04-29 17:01:03.089678 - 1:25:43 - step: 18460 acc: 0 loss: 1.48 grad: 1.46e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6393 data: 0.0906 lr: 4.69e-05 mem: 47% pow: 621.275 W 0: INFO 26-04-29 17:01:18.240521 - 1:25:59 - step: 18470 acc: 0 loss: 1.6236 grad: 1.49e-01 flops: 3.73e+14 wps: 4.33e+04 iter: 0.6326 data: 0.0918 lr: 4.69e-05 mem: 47% pow: 641.185 W 0: INFO 26-04-29 17:01:32.747732 - 1:26:13 - step: 18480 acc: 0 loss: 1.4388 grad: 1.47e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.6034 data: 0.0818 lr: 4.69e-05 mem: 47% pow: 678.348 W 0: INFO 26-04-29 17:01:50.059418 - 1:26:30 - step: 18490 acc: 0 loss: 1.2787 grad: 1.70e-01 flops: 3.26e+14 wps: 3.79e+04 iter: 0.6029 data: 0.0785 lr: 4.69e-05 mem: 47% pow: 659.669 W 0: INFO 26-04-29 17:02:04.184317 - 1:26:44 - step: 18500 acc: 0 loss: 1.5127 grad: 1.49e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5974 data: 0.0974 lr: 4.69e-05 mem: 47% pow: 646.984 W 0: INFO 26-04-29 17:02:21.597727 - 1:27:02 - step: 18510 acc: 0 loss: 1.3667 grad: 1.43e-01 flops: 3.24e+14 wps: 3.77e+04 iter: 0.6721 data: 0.0655 lr: 4.69e-05 mem: 54% pow: 625.399 W 0: INFO 26-04-29 17:02:36.106517 - 1:27:16 - step: 18520 acc: 0 loss: 1.3456 grad: 1.43e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.5946 data: 0.0911 lr: 4.68e-05 mem: 47% pow: 661.177 W 0: INFO 26-04-29 17:02:50.713656 - 1:27:31 - step: 18530 acc: 0 loss: 1.4045 grad: 1.52e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6571 data: 0.0717 lr: 4.68e-05 mem: 47% pow: 633.631 W 0: INFO 26-04-29 17:03:06.148602 - 1:27:46 - step: 18540 acc: 0 loss: 1.6431 grad: 1.50e-01 flops: 3.66e+14 wps: 4.25e+04 iter: 0.5968 data: 0.0873 lr: 4.68e-05 mem: 47% pow: 660.543 W 0: INFO 26-04-29 17:03:19.949258 - 1:28:00 - step: 18550 acc: 0 loss: 1.0914 grad: 1.48e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6227 data: 0.0918 lr: 4.68e-05 mem: 47% pow: 636.622 W 0: INFO 26-04-29 17:03:34.684525 - 1:28:15 - step: 18560 acc: 0 loss: 1.3767 grad: 1.51e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.6355 data: 0.0668 lr: 4.68e-05 mem: 47% pow: 647.538 W 0: INFO 26-04-29 17:03:48.886447 - 1:28:29 - step: 18570 acc: 0 loss: 1.1665 grad: 1.53e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5792 data: 0.0926 lr: 4.68e-05 mem: 47% pow: 663.223 W 0: INFO 26-04-29 17:04:04.081950 - 1:28:44 - step: 18580 acc: 0 loss: 1.6057 grad: 1.61e-01 flops: 3.72e+14 wps: 4.31e+04 iter: 0.5959 data: 0.0898 lr: 4.68e-05 mem: 47% pow: 657.017 W 0: INFO 26-04-29 17:04:21.565911 - 1:29:02 - step: 18590 acc: 0 loss: 1.6686 grad: 1.74e-01 flops: 3.23e+14 wps: 3.75e+04 iter: 3.2827 data: 0.0896 lr: 4.67e-05 mem: 47% pow: 434.966 W 0: INFO 26-04-29 17:04:36.169619 - 1:29:16 - step: 18600 acc: 0 loss: 1.7923 grad: 1.48e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.7961 data: 0.0964 lr: 4.67e-05 mem: 47% pow: 540.108 W 0: INFO 26-04-29 17:04:53.284605 - 1:29:34 - step: 18610 acc: 0 loss: 1.6821 grad: 1.50e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.6053 data: 0.0844 lr: 4.67e-05 mem: 54% pow: 655.841 W 0: INFO 26-04-29 17:05:07.378062 - 1:29:48 - step: 18620 acc: 0 loss: 1.7736 grad: 1.43e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6808 data: 0.0902 lr: 4.67e-05 mem: 47% pow: 608.692 W 0: INFO 26-04-29 17:05:21.845526 - 1:30:02 - step: 18630 acc: 0 loss: 1.291 grad: 1.54e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.5877 data: 0.0848 lr: 4.67e-05 mem: 47% pow: 663.993 W 0: INFO 26-04-29 17:05:35.762486 - 1:30:16 - step: 18640 acc: 0 loss: 1.4468 grad: 1.50e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5779 data: 0.0927 lr: 4.67e-05 mem: 47% pow: 681.551 W 0: INFO 26-04-29 17:05:52.193938 - 1:30:32 - step: 18650 acc: 0 loss: 1.4316 grad: 1.42e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.6163 data: 0.0726 lr: 4.67e-05 mem: 47% pow: 660.771 W 0: INFO 26-04-29 17:06:06.038474 - 1:30:46 - step: 18660 acc: 0 loss: 1.5971 grad: 1.44e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5984 data: 0.1214 lr: 4.66e-05 mem: 47% pow: 631.028 W 0: INFO 26-04-29 17:06:22.406543 - 1:31:03 - step: 18670 acc: 0 loss: 1.3755 grad: 1.49e-01 flops: 3.45e+14 wps: 4.00e+04 iter: 0.6032 data: 0.0898 lr: 4.66e-05 mem: 47% pow: 661.525 W 0: INFO 26-04-29 17:06:38.118190 - 1:31:18 - step: 18680 acc: 0 loss: 1.1539 grad: 1.59e-01 flops: 3.59e+14 wps: 4.17e+04 iter: 0.5959 data: 0.0869 lr: 4.66e-05 mem: 47% pow: 667.549 W 0: INFO 26-04-29 17:06:52.214177 - 1:31:33 - step: 18690 acc: 0 loss: 1.59 grad: 1.50e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6484 data: 0.0634 lr: 4.66e-05 mem: 47% pow: 640.532 W 0: INFO 26-04-29 17:07:06.549299 - 1:31:47 - step: 18700 acc: 0 loss: 1.2682 grad: 1.51e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.6326 data: 0.0923 lr: 4.66e-05 mem: 47% pow: 634.718 W 0: INFO 26-04-29 17:07:27.508830 - 1:32:08 - step: 18710 acc: 0 loss: 1.1378 grad: 1.54e-01 flops: 2.69e+14 wps: 3.13e+04 iter: 0.6208 data: 0.0934 lr: 4.66e-05 mem: 54% pow: 643.766 W 0: INFO 26-04-29 17:07:41.162985 - 1:32:21 - step: 18720 acc: 0 loss: 1.4541 grad: 1.57e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.7037 data: 0.084 lr: 4.65e-05 mem: 47% pow: 603.037 W 0: INFO 26-04-29 17:07:55.841243 - 1:32:36 - step: 18730 acc: 0 loss: 1.2236 grad: 1.45e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6047 data: 0.0895 lr: 4.65e-05 mem: 47% pow: 649.869 W 0: INFO 26-04-29 17:08:09.937007 - 1:32:50 - step: 18740 acc: 0 loss: 1.5081 grad: 1.83e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.69 data: 0.088 lr: 4.65e-05 mem: 47% pow: 595.428 W 0: INFO 26-04-29 17:08:25.436713 - 1:33:06 - step: 18750 acc: 0 loss: 1.6628 grad: 1.55e-01 flops: 3.64e+14 wps: 4.23e+04 iter: 0.7114 data: 0.0806 lr: 4.65e-05 mem: 47% pow: 598.401 W 0: INFO 26-04-29 17:08:39.113742 - 1:33:19 - step: 18760 acc: 0 loss: 1.2965 grad: 1.60e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6096 data: 0.084 lr: 4.65e-05 mem: 47% pow: 652.957 W 0: INFO 26-04-29 17:08:54.161282 - 1:33:34 - step: 18770 acc: 0 loss: 1.434 grad: 1.41e-01 flops: 3.75e+14 wps: 4.36e+04 iter: 0.601 data: 0.0825 lr: 4.65e-05 mem: 47% pow: 662.259 W 0: INFO 26-04-29 17:09:08.563416 - 1:33:49 - step: 18780 acc: 0 loss: 1.2726 grad: 1.44e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.5917 data: 0.0985 lr: 4.65e-05 mem: 47% pow: 657.619 W 0: INFO 26-04-29 17:09:22.585370 - 1:34:03 - step: 18790 acc: 0 loss: 1.6248 grad: 1.43e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.7212 data: 0.0893 lr: 4.64e-05 mem: 47% pow: 585.215 W 0: INFO 26-04-29 17:09:36.838958 - 1:34:17 - step: 18800 acc: 0 loss: 1.4658 grad: 1.51e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.592 data: 0.0825 lr: 4.64e-05 mem: 47% pow: 660.214 W 0: INFO 26-04-29 17:09:54.025672 - 1:34:34 - step: 18810 acc: 0 loss: 1.5854 grad: 1.48e-01 flops: 3.29e+14 wps: 3.81e+04 iter: 0.6332 data: 0.1332 lr: 4.64e-05 mem: 54% pow: 628.446 W 0: INFO 26-04-29 17:10:07.946723 - 1:34:48 - step: 18820 acc: 0 loss: 1.4009 grad: 1.48e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6851 data: 0.022 lr: 4.64e-05 mem: 47% pow: 648.898 W 0: INFO 26-04-29 17:10:22.391436 - 1:35:03 - step: 18830 acc: 0 loss: 1.2974 grad: 1.64e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6287 data: 0.0834 lr: 4.64e-05 mem: 47% pow: 644.027 W 0: INFO 26-04-29 17:10:37.727139 - 1:35:18 - step: 18840 acc: 0 loss: 1.5334 grad: 1.46e-01 flops: 3.68e+14 wps: 4.28e+04 iter: 0.6164 data: 0.0657 lr: 4.64e-05 mem: 47% pow: 659.603 W 0: INFO 26-04-29 17:10:51.587747 - 1:35:32 - step: 18850 acc: 0 loss: 1.225 grad: 1.55e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6115 data: 0.1164 lr: 4.64e-05 mem: 47% pow: 637.475 W 0: INFO 26-04-29 17:11:05.802170 - 1:35:46 - step: 18860 acc: 0 loss: 1.3096 grad: 1.40e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.5789 data: 0.1313 lr: 4.63e-05 mem: 47% pow: 648.567 W 0: INFO 26-04-29 17:11:19.562805 - 1:36:00 - step: 18870 acc: 0 loss: 1.288 grad: 1.48e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6762 data: 0.0913 lr: 4.63e-05 mem: 47% pow: 617.033 W 0: INFO 26-04-29 17:11:33.902173 - 1:36:14 - step: 18880 acc: 0 loss: 1.4982 grad: 1.50e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.6067 data: 0.0896 lr: 4.63e-05 mem: 47% pow: 502.214 W 0: INFO 26-04-29 17:11:47.595283 - 1:36:28 - step: 18890 acc: 0 loss: 1.3807 grad: 1.62e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5873 data: 0.1018 lr: 4.63e-05 mem: 47% pow: 674.0 W 0: INFO 26-04-29 17:12:01.445139 - 1:36:42 - step: 18900 acc: 0 loss: 1.3534 grad: 1.50e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5995 data: 0.0919 lr: 4.63e-05 mem: 47% pow: 658.961 W 0: INFO 26-04-29 17:12:18.222954 - 1:36:59 - step: 18910 acc: 0 loss: 0.9961 grad: 1.50e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6199 data: 0.0851 lr: 4.63e-05 mem: 54% pow: 645.107 W 0: INFO 26-04-29 17:12:31.966398 - 1:37:12 - step: 18920 acc: 0 loss: 1.4707 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7347 data: 0.0911 lr: 4.62e-05 mem: 47% pow: 584.575 W 0: INFO 26-04-29 17:12:46.807407 - 1:37:27 - step: 18930 acc: 0 loss: 1.2998 grad: 1.61e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.5794 data: 0.1676 lr: 4.62e-05 mem: 47% pow: 623.081 W 0: INFO 26-04-29 17:13:01.539225 - 1:37:42 - step: 18940 acc: 0 loss: 1.4433 grad: 1.45e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 1.219 data: 0.0794 lr: 4.62e-05 mem: 47% pow: 431.405 W 0: INFO 26-04-29 17:13:15.566113 - 1:37:56 - step: 18950 acc: 0 loss: 1.9452 grad: 1.65e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.5962 data: 0.0889 lr: 4.62e-05 mem: 47% pow: 658.045 W 0: INFO 26-04-29 17:13:30.945978 - 1:38:11 - step: 18960 acc: 0 loss: 1.4438 grad: 1.60e-01 flops: 3.67e+14 wps: 4.27e+04 iter: 0.6119 data: 0.0874 lr: 4.62e-05 mem: 47% pow: 650.051 W 0: INFO 26-04-29 17:13:44.747084 - 1:38:25 - step: 18970 acc: 0 loss: 1.0467 grad: 1.71e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6397 data: 0.0818 lr: 4.62e-05 mem: 47% pow: 643.324 W 0: INFO 26-04-29 17:13:58.687296 - 1:38:39 - step: 18980 acc: 0 loss: 1.2044 grad: 1.53e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6167 data: 0.0896 lr: 4.62e-05 mem: 47% pow: 646.264 W 0: INFO 26-04-29 17:14:12.916788 - 1:38:53 - step: 18990 acc: 0 loss: 1.611 grad: 1.50e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6558 data: 0.0466 lr: 4.61e-05 mem: 47% pow: 648.004 W 0: INFO 26-04-29 17:14:27.243117 - 1:39:08 - step: 19000 acc: 0 loss: 1.6339 grad: 1.55e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.5863 data: 0.0895 lr: 4.61e-05 mem: 47% pow: 660.958 W 0: INFO 26-04-29 17:14:30.912291 - 1:39:11 - garbage collection 0: INFO 26-04-29 17:14:46.184022 - 1:39:26 - step: 19010 acc: 0 loss: 1.3139 grad: 1.53e-01 flops: 2.98e+14 wps: 3.46e+04 iter: 0.7936 data: 0.0904 lr: 4.61e-05 mem: 54% pow: 551.872 W 0: INFO 26-04-29 17:14:59.986382 - 1:39:40 - step: 19020 acc: 0 loss: 1.2768 grad: 1.67e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.7089 data: 0.0931 lr: 4.61e-05 mem: 47% pow: 589.23 W 0: INFO 26-04-29 17:15:13.833437 - 1:39:54 - step: 19030 acc: 0 loss: 1.1314 grad: 1.55e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.601 data: 0.0838 lr: 4.61e-05 mem: 47% pow: 681.364 W 0: INFO 26-04-29 17:15:27.924192 - 1:40:08 - step: 19040 acc: 0 loss: 1.3136 grad: 1.56e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5807 data: 0.1616 lr: 4.61e-05 mem: 47% pow: 630.47 W 0: INFO 26-04-29 17:15:42.084866 - 1:40:22 - step: 19050 acc: 0 loss: 1.3828 grad: 1.63e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6501 data: 0.0872 lr: 4.61e-05 mem: 47% pow: 616.378 W 0: INFO 26-04-29 17:15:56.074736 - 1:40:36 - step: 19060 acc: 0 loss: 1.5354 grad: 1.57e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6282 data: 0.0839 lr: 4.60e-05 mem: 47% pow: 642.372 W 0: INFO 26-04-29 17:16:10.367506 - 1:40:51 - step: 19070 acc: 0 loss: 1.6373 grad: 1.51e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6708 data: 0.077 lr: 4.60e-05 mem: 47% pow: 630.516 W 0: INFO 26-04-29 17:16:24.765303 - 1:41:05 - step: 19080 acc: 0 loss: 1.4169 grad: 1.59e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.5934 data: 0.0934 lr: 4.60e-05 mem: 47% pow: 662.639 W 0: INFO 26-04-29 17:16:38.767555 - 1:41:19 - step: 19090 acc: 0 loss: 1.5624 grad: 1.48e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5845 data: 0.1066 lr: 4.60e-05 mem: 47% pow: 652.574 W 0: INFO 26-04-29 17:16:52.786549 - 1:41:33 - step: 19100 acc: 0 loss: 1.7484 grad: 1.58e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.7097 data: 0.1194 lr: 4.60e-05 mem: 47% pow: 584.472 W 0: INFO 26-04-29 17:17:09.774313 - 1:41:50 - step: 19110 acc: 0 loss: 1.0539 grad: 1.52e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 0.5896 data: 0.0874 lr: 4.60e-05 mem: 54% pow: 690.472 W 0: INFO 26-04-29 17:17:23.697799 - 1:42:04 - step: 19120 acc: 0 loss: 1.3743 grad: 1.59e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6164 data: 0.0784 lr: 4.60e-05 mem: 47% pow: 643.297 W 0: INFO 26-04-29 17:17:37.632995 - 1:42:18 - step: 19130 acc: 0 loss: 1.4185 grad: 1.77e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.634 data: 0.0791 lr: 4.59e-05 mem: 47% pow: 635.375 W 0: INFO 26-04-29 17:17:52.248852 - 1:42:33 - step: 19140 acc: 0 loss: 1.3134 grad: 1.66e-01 flops: 3.86e+14 wps: 4.49e+04 iter: 0.5825 data: 0.0947 lr: 4.59e-05 mem: 47% pow: 688.098 W 0: INFO 26-04-29 17:18:12.391152 - 1:42:53 - step: 19150 acc: 0 loss: 1.7078 grad: 1.48e-01 flops: 2.80e+14 wps: 3.25e+04 iter: 0.6531 data: 0.0768 lr: 4.59e-05 mem: 47% pow: 627.996 W 0: INFO 26-04-29 17:18:27.142681 - 1:43:07 - step: 19160 acc: 0 loss: 1.5336 grad: 1.48e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.6129 data: 0.0902 lr: 4.59e-05 mem: 47% pow: 649.045 W 0: INFO 26-04-29 17:18:40.893376 - 1:43:21 - step: 19170 acc: 0 loss: 1.3805 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.616 data: 0.0763 lr: 4.59e-05 mem: 47% pow: 652.36 W 0: INFO 26-04-29 17:18:57.992724 - 1:43:38 - step: 19180 acc: 0 loss: 1.5629 grad: 1.46e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.5796 data: 0.1126 lr: 4.59e-05 mem: 47% pow: 654.701 W 0: INFO 26-04-29 17:19:11.901812 - 1:43:52 - step: 19190 acc: 0 loss: 1.5036 grad: 1.49e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6252 data: 0.0819 lr: 4.58e-05 mem: 47% pow: 657.232 W 0: INFO 26-04-29 17:19:25.919770 - 1:44:06 - step: 19200 acc: 0 loss: 1.5133 grad: 1.51e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6749 data: 0.0033 lr: 4.58e-05 mem: 47% pow: 664.538 W 0: INFO 26-04-29 17:19:42.668773 - 1:44:23 - step: 19210 acc: 0 loss: 1.5554 grad: 1.58e-01 flops: 3.37e+14 wps: 3.92e+04 iter: 0.6231 data: 0.0989 lr: 4.58e-05 mem: 54% pow: 636.971 W 0: INFO 26-04-29 17:19:56.475728 - 1:44:37 - step: 19220 acc: 0 loss: 1.6839 grad: 1.79e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6687 data: 0.0125 lr: 4.58e-05 mem: 47% pow: 668.469 W 0: INFO 26-04-29 17:20:10.480378 - 1:44:51 - step: 19230 acc: 0 loss: 1.5132 grad: 1.46e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6081 data: 0.0923 lr: 4.58e-05 mem: 47% pow: 652.387 W 0: INFO 26-04-29 17:20:24.428093 - 1:45:05 - step: 19240 acc: 0 loss: 1.188 grad: 1.54e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6233 data: 0.0801 lr: 4.58e-05 mem: 47% pow: 658.279 W 0: INFO 26-04-29 17:20:38.474568 - 1:45:19 - step: 19250 acc: 0 loss: 1.3589 grad: 1.61e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6943 data: 0.0798 lr: 4.58e-05 mem: 47% pow: 609.531 W 0: INFO 26-04-29 17:20:52.647323 - 1:45:33 - step: 19260 acc: 0 loss: 1.4003 grad: 1.44e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5882 data: 0.0845 lr: 4.57e-05 mem: 47% pow: 658.792 W 0: INFO 26-04-29 17:21:06.384064 - 1:45:47 - step: 19270 acc: 0 loss: 1.1805 grad: 1.76e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6385 data: 0.0828 lr: 4.57e-05 mem: 47% pow: 636.716 W 0: INFO 26-04-29 17:21:20.347404 - 1:46:01 - step: 19280 acc: 0 loss: 1.338 grad: 1.56e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6262 data: 0.0853 lr: 4.57e-05 mem: 47% pow: 639.531 W 0: INFO 26-04-29 17:21:34.145697 - 1:46:14 - step: 19290 acc: 0 loss: 1.24 grad: 1.56e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6239 data: 0.0873 lr: 4.57e-05 mem: 47% pow: 656.866 W 0: INFO 26-04-29 17:21:48.406389 - 1:46:29 - step: 19300 acc: 0 loss: 1.3026 grad: 1.42e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.5954 data: 0.0855 lr: 4.57e-05 mem: 47% pow: 656.854 W 0: INFO 26-04-29 17:22:05.203529 - 1:46:46 - step: 19310 acc: 0 loss: 1.1575 grad: 1.43e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6058 data: 0.0796 lr: 4.57e-05 mem: 54% pow: 656.755 W 0: INFO 26-04-29 17:22:19.132868 - 1:46:59 - step: 19320 acc: 0 loss: 1.5247 grad: 1.41e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.8202 data: 0.096 lr: 4.57e-05 mem: 47% pow: 538.202 W 0: INFO 26-04-29 17:22:33.188354 - 1:47:13 - step: 19330 acc: 0 loss: 1.298 grad: 1.49e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.7161 data: 0.0952 lr: 4.56e-05 mem: 47% pow: 587.265 W 0: INFO 26-04-29 17:22:47.303831 - 1:47:28 - step: 19340 acc: 0 loss: 1.7224 grad: 1.54e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6176 data: 0.0914 lr: 4.56e-05 mem: 47% pow: 645.363 W 0: INFO 26-04-29 17:23:01.657744 - 1:47:42 - step: 19350 acc: 0 loss: 1.3869 grad: 1.47e-01 flops: 3.93e+14 wps: 4.57e+04 iter: 0.5954 data: 0.0844 lr: 4.56e-05 mem: 47% pow: 654.809 W 0: INFO 26-04-29 17:23:15.529682 - 1:47:56 - step: 19360 acc: 0 loss: 1.3947 grad: 1.44e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5856 data: 0.0958 lr: 4.56e-05 mem: 47% pow: 658.871 W 0: INFO 26-04-29 17:23:29.468590 - 1:48:10 - step: 19370 acc: 0 loss: 1.7597 grad: 1.51e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.6108 data: 0.0738 lr: 4.56e-05 mem: 47% pow: 661.661 W 0: INFO 26-04-29 17:23:43.229310 - 1:48:24 - step: 19380 acc: 0 loss: 1.44 grad: 1.44e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6003 data: 0.086 lr: 4.56e-05 mem: 47% pow: 668.08 W 0: INFO 26-04-29 17:23:56.765322 - 1:48:37 - step: 19390 acc: 0 loss: 1.6432 grad: 1.55e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.6334 data: 0.0885 lr: 4.55e-05 mem: 47% pow: 636.035 W 0: INFO 26-04-29 17:24:10.673445 - 1:48:51 - step: 19400 acc: 0 loss: 1.3891 grad: 1.46e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6043 data: 0.0717 lr: 4.55e-05 mem: 47% pow: 657.135 W 0: INFO 26-04-29 17:24:27.526117 - 1:49:08 - step: 19410 acc: 0 loss: 1.2116 grad: 1.43e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6233 data: 0.0858 lr: 4.55e-05 mem: 54% pow: 657.275 W 0: INFO 26-04-29 17:24:41.261523 - 1:49:22 - step: 19420 acc: 0 loss: 1.6029 grad: 1.42e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6278 data: 0.0852 lr: 4.55e-05 mem: 47% pow: 641.342 W 0: INFO 26-04-29 17:24:54.926551 - 1:49:35 - step: 19430 acc: 0 loss: 1.7617 grad: 1.44e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6083 data: 0.0614 lr: 4.55e-05 mem: 47% pow: 672.864 W 0: INFO 26-04-29 17:25:08.731060 - 1:49:49 - step: 19440 acc: 0 loss: 1.409 grad: 1.50e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6284 data: 0.0857 lr: 4.55e-05 mem: 47% pow: 629.5 W 0: INFO 26-04-29 17:25:22.422776 - 1:50:03 - step: 19450 acc: 0 loss: 1.1286 grad: 1.48e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5904 data: 0.0887 lr: 4.55e-05 mem: 47% pow: 659.235 W 0: INFO 26-04-29 17:25:36.395008 - 1:50:17 - step: 19460 acc: 0 loss: 1.2493 grad: 1.54e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5805 data: 0.1111 lr: 4.54e-05 mem: 47% pow: 653.74 W 0: INFO 26-04-29 17:25:50.326390 - 1:50:31 - step: 19470 acc: 0 loss: 1.3016 grad: 1.51e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.5951 data: 0.0904 lr: 4.54e-05 mem: 47% pow: 667.241 W 0: INFO 26-04-29 17:26:04.084581 - 1:50:44 - step: 19480 acc: 0 loss: 1.392 grad: 1.58e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5797 data: 0.1055 lr: 4.54e-05 mem: 47% pow: 665.462 W 0: INFO 26-04-29 17:26:17.945589 - 1:50:58 - step: 19490 acc: 0 loss: 1.2578 grad: 1.58e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6439 data: 0.0818 lr: 4.54e-05 mem: 47% pow: 632.09 W 0: INFO 26-04-29 17:26:31.496770 - 1:51:12 - step: 19500 acc: 0 loss: 1.1365 grad: 1.58e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5953 data: 0.0821 lr: 4.54e-05 mem: 47% pow: 663.095 W 0: INFO 26-04-29 17:26:48.287696 - 1:51:29 - step: 19510 acc: 0 loss: 1.3215 grad: 1.60e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6248 data: 0.0576 lr: 4.54e-05 mem: 54% pow: 652.49 W 0: INFO 26-04-29 17:27:02.143000 - 1:51:42 - step: 19520 acc: 0 loss: 1.2615 grad: 1.52e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6565 data: 0.0851 lr: 4.54e-05 mem: 47% pow: 625.496 W 0: INFO 26-04-29 17:27:16.200251 - 1:51:56 - step: 19530 acc: 0 loss: 1.4628 grad: 1.46e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.644 data: 0.0883 lr: 4.53e-05 mem: 47% pow: 635.255 W 0: INFO 26-04-29 17:27:30.013900 - 1:52:10 - step: 19540 acc: 0 loss: 1.3362 grad: 1.55e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6163 data: 0.0879 lr: 4.53e-05 mem: 47% pow: 650.088 W 0: INFO 26-04-29 17:27:43.683190 - 1:52:24 - step: 19550 acc: 0 loss: 1.7117 grad: 1.56e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5785 data: 0.0963 lr: 4.53e-05 mem: 47% pow: 659.81 W 0: INFO 26-04-29 17:27:57.729733 - 1:52:38 - step: 19560 acc: 0 loss: 1.6858 grad: 1.54e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6314 data: 0.0871 lr: 4.53e-05 mem: 47% pow: 639.589 W 0: INFO 26-04-29 17:28:11.346723 - 1:52:52 - step: 19570 acc: 0 loss: 1.3533 grad: 1.53e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6334 data: 0.099 lr: 4.53e-05 mem: 47% pow: 639.418 W 0: INFO 26-04-29 17:28:24.996916 - 1:53:05 - step: 19580 acc: 0 loss: 1.4086 grad: 1.50e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5844 data: 0.0866 lr: 4.53e-05 mem: 47% pow: 672.119 W 0: INFO 26-04-29 17:28:39.001962 - 1:53:19 - step: 19590 acc: 0 loss: 1.5048 grad: 1.55e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6075 data: 0.087 lr: 4.53e-05 mem: 47% pow: 645.021 W 0: INFO 26-04-29 17:28:53.064725 - 1:53:33 - step: 19600 acc: 0 loss: 1.4288 grad: 1.49e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6143 data: 0.0941 lr: 4.52e-05 mem: 47% pow: 659.774 W 0: INFO 26-04-29 17:29:09.821164 - 1:53:50 - step: 19610 acc: 0 loss: 1.6201 grad: 1.76e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6692 data: 0.083 lr: 4.52e-05 mem: 54% pow: 610.209 W 0: INFO 26-04-29 17:29:23.846123 - 1:54:04 - step: 19620 acc: 0 loss: 1.3304 grad: 1.49e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6055 data: 0.0825 lr: 4.52e-05 mem: 47% pow: 671.197 W 0: INFO 26-04-29 17:29:37.547823 - 1:54:18 - step: 19630 acc: 0 loss: 1.4971 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5888 data: 0.0858 lr: 4.52e-05 mem: 47% pow: 664.682 W 0: INFO 26-04-29 17:29:51.302503 - 1:54:32 - step: 19640 acc: 0 loss: 1.1314 grad: 1.62e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5862 data: 0.0879 lr: 4.52e-05 mem: 47% pow: 665.676 W 0: INFO 26-04-29 17:30:05.211437 - 1:54:46 - step: 19650 acc: 0 loss: 1.3233 grad: 1.42e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6127 data: 0.0657 lr: 4.52e-05 mem: 47% pow: 657.956 W 0: INFO 26-04-29 17:30:18.691484 - 1:54:59 - step: 19660 acc: 0 loss: 1.1721 grad: 1.53e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6101 data: 0.0813 lr: 4.51e-05 mem: 47% pow: 656.642 W 0: INFO 26-04-29 17:30:32.904098 - 1:55:13 - step: 19670 acc: 0 loss: 1.4199 grad: 1.58e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.7124 data: 0.0994 lr: 4.51e-05 mem: 47% pow: 589.619 W 0: INFO 26-04-29 17:30:47.111216 - 1:55:27 - step: 19680 acc: 0 loss: 1.0059 grad: 1.51e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6823 data: 0.0872 lr: 4.51e-05 mem: 47% pow: 615.636 W 0: INFO 26-04-29 17:31:01.326111 - 1:55:42 - step: 19690 acc: 0 loss: 1.6132 grad: 1.54e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5829 data: 0.1295 lr: 4.51e-05 mem: 47% pow: 647.286 W 0: INFO 26-04-29 17:31:15.013451 - 1:55:55 - step: 19700 acc: 0 loss: 1.3268 grad: 1.43e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6361 data: 0.0784 lr: 4.51e-05 mem: 47% pow: 642.479 W 0: INFO 26-04-29 17:31:31.586506 - 1:56:12 - step: 19710 acc: 0 loss: 1.6686 grad: 1.46e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.5989 data: 0.0898 lr: 4.51e-05 mem: 54% pow: 661.845 W 0: INFO 26-04-29 17:31:45.191160 - 1:56:25 - step: 19720 acc: 0 loss: 1.4497 grad: 1.50e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6502 data: 0.1017 lr: 4.51e-05 mem: 47% pow: 623.007 W 0: INFO 26-04-29 17:31:59.118977 - 1:56:39 - step: 19730 acc: 0 loss: 1.2074 grad: 1.48e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6242 data: 0.057 lr: 4.50e-05 mem: 47% pow: 662.855 W 0: INFO 26-04-29 17:32:13.192232 - 1:56:53 - step: 19740 acc: 0 loss: 1.3333 grad: 1.49e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6293 data: 0.086 lr: 4.50e-05 mem: 47% pow: 639.074 W 0: INFO 26-04-29 17:32:26.890618 - 1:57:07 - step: 19750 acc: 0 loss: 1.4814 grad: 1.58e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.654 data: 0.0768 lr: 4.50e-05 mem: 47% pow: 627.522 W 0: INFO 26-04-29 17:32:40.320375 - 1:57:21 - step: 19760 acc: 0 loss: 1.7957 grad: 1.49e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5783 data: 0.0924 lr: 4.50e-05 mem: 47% pow: 685.715 W 0: INFO 26-04-29 17:32:54.357247 - 1:57:35 - step: 19770 acc: 0 loss: 1.5932 grad: 1.66e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6289 data: 0.087 lr: 4.50e-05 mem: 47% pow: 643.007 W 0: INFO 26-04-29 17:33:08.300941 - 1:57:49 - step: 19780 acc: 0 loss: 1.3432 grad: 1.59e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6113 data: 0.0843 lr: 4.50e-05 mem: 47% pow: 646.868 W 0: INFO 26-04-29 17:33:22.438308 - 1:58:03 - step: 19790 acc: 0 loss: 1.9931 grad: 1.51e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.5978 data: 0.0969 lr: 4.50e-05 mem: 47% pow: 649.954 W 0: INFO 26-04-29 17:33:36.876714 - 1:58:17 - step: 19800 acc: 0 loss: 1.7472 grad: 1.55e-01 flops: 3.93e+14 wps: 4.57e+04 iter: 0.5959 data: 0.0981 lr: 4.49e-05 mem: 47% pow: 654.035 W 0: INFO 26-04-29 17:33:53.497940 - 1:58:34 - step: 19810 acc: 0 loss: 1.6283 grad: 1.47e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6197 data: 0.0898 lr: 4.49e-05 mem: 54% pow: 639.023 W 0: INFO 26-04-29 17:34:07.266227 - 1:58:48 - step: 19820 acc: 0 loss: 1.2699 grad: 1.54e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.686 data: 0.0809 lr: 4.49e-05 mem: 47% pow: 612.847 W 0: INFO 26-04-29 17:34:20.869144 - 1:59:01 - step: 19830 acc: 0 loss: 1.2191 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.624 data: 0.0795 lr: 4.49e-05 mem: 47% pow: 649.721 W 0: INFO 26-04-29 17:34:34.639085 - 1:59:15 - step: 19840 acc: 0 loss: 1.5101 grad: 1.45e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6874 data: 0.1076 lr: 4.49e-05 mem: 47% pow: 594.63 W 0: INFO 26-04-29 17:34:48.669596 - 1:59:29 - step: 19850 acc: 0 loss: 1.3864 grad: 1.48e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.5935 data: 0.0937 lr: 4.49e-05 mem: 47% pow: 663.451 W 0: INFO 26-04-29 17:35:02.713408 - 1:59:43 - step: 19860 acc: 0 loss: 1.7124 grad: 1.50e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.5791 data: 0.092 lr: 4.48e-05 mem: 47% pow: 667.197 W 0: INFO 26-04-29 17:35:16.696870 - 1:59:57 - step: 19870 acc: 0 loss: 1.7598 grad: 1.45e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6053 data: 0.0942 lr: 4.48e-05 mem: 47% pow: 647.981 W 0: INFO 26-04-29 17:35:30.717045 - 2:00:11 - step: 19880 acc: 0 loss: 1.2409 grad: 1.45e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5777 data: 0.0949 lr: 4.48e-05 mem: 47% pow: 663.54 W 0: INFO 26-04-29 17:35:44.416629 - 2:00:25 - step: 19890 acc: 0 loss: 1.0669 grad: 1.49e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6038 data: 0.0835 lr: 4.48e-05 mem: 47% pow: 659.662 W 0: INFO 26-04-29 17:35:58.108855 - 2:00:38 - step: 19900 acc: 0 loss: 1.3614 grad: 1.62e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6337 data: 0.0663 lr: 4.48e-05 mem: 47% pow: 648.255 W 0: INFO 26-04-29 17:36:15.280568 - 2:00:56 - step: 19910 acc: 0 loss: 1.2127 grad: 1.56e-01 flops: 3.29e+14 wps: 3.82e+04 iter: 0.6253 data: 0.0854 lr: 4.48e-05 mem: 54% pow: 642.652 W 0: INFO 26-04-29 17:36:29.281748 - 2:01:10 - step: 19920 acc: 0 loss: 1.1819 grad: 1.48e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.7777 data: 0.0934 lr: 4.48e-05 mem: 47% pow: 554.907 W 0: INFO 26-04-29 17:36:43.233829 - 2:01:24 - step: 19930 acc: 0 loss: 1.6397 grad: 1.51e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6101 data: 0.0718 lr: 4.47e-05 mem: 47% pow: 665.371 W 0: INFO 26-04-29 17:36:57.140049 - 2:01:37 - step: 19940 acc: 0 loss: 1.3277 grad: 1.50e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7349 data: 0.061 lr: 4.47e-05 mem: 47% pow: 597.515 W 0: INFO 26-04-29 17:37:10.854346 - 2:01:51 - step: 19950 acc: 0 loss: 1.3749 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6403 data: 0.0532 lr: 4.47e-05 mem: 47% pow: 661.977 W 0: INFO 26-04-29 17:37:24.791917 - 2:02:05 - step: 19960 acc: 0 loss: 1.5399 grad: 1.58e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6213 data: 0.0813 lr: 4.47e-05 mem: 47% pow: 646.579 W 0: INFO 26-04-29 17:37:38.910503 - 2:02:19 - step: 19970 acc: 0 loss: 1.6433 grad: 1.81e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6296 data: 0.0717 lr: 4.47e-05 mem: 47% pow: 638.755 W 0: INFO 26-04-29 17:37:52.528228 - 2:02:33 - step: 19980 acc: 0 loss: 1.5431 grad: 1.51e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6053 data: 0.0934 lr: 4.47e-05 mem: 47% pow: 644.368 W 0: INFO 26-04-29 17:38:06.360144 - 2:02:47 - step: 19990 acc: 0 loss: 1.584 grad: 1.59e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5906 data: 0.0916 lr: 4.47e-05 mem: 47% pow: 673.717 W 0: INFO 26-04-29 17:38:20.331155 - 2:03:01 - step: 20000 acc: 0 loss: 1.2488 grad: 1.43e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.62 data: 0.0741 lr: 4.46e-05 mem: 47% pow: 675.549 W 0: INFO 26-04-29 17:38:20.334300 - 2:03:01 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000020000 0: INFO 26-04-29 17:38:20.340941 - 2:03:01 - Saving... 0: INFO 26-04-29 17:38:27.089587 - 2:03:07 - State dict saved! 0: INFO 26-04-29 17:38:27.211468 - 2:03:08 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000020000/train_state_00000.json 0: INFO 26-04-29 17:38:27.217604 - 2:03:08 - Train state saved ! 0: INFO 26-04-29 17:38:27.217883 - 2:03:08 - Cleaning up checkpoints... 0: INFO 26-04-29 17:38:27.218070 - 2:03:08 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000015000'), PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000020000')] 0: INFO 26-04-29 17:38:27.218195 - 2:03:08 - Eval folders: [] 0: INFO 26-04-29 17:38:27.218324 - 2:03:08 - Other folders: [] 0: INFO 26-04-29 17:38:27.218466 - 2:03:08 - Removing folders: {PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000015000')} 0: INFO 26-04-29 17:38:31.366522 - 2:03:12 - garbage collection 0: INFO 26-04-29 17:38:45.980455 - 2:03:26 - step: 20010 acc: 0 loss: 1.2698 grad: 1.48e-01 flops: 2.20e+14 wps: 2.56e+04 iter: 0.5961 data: 0.1097 lr: 4.46e-05 mem: 54% pow: 650.155 W 0: INFO 26-04-29 17:38:59.811612 - 2:03:40 - step: 20020 acc: 0 loss: 1.5719 grad: 1.43e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6454 data: 0.0777 lr: 4.46e-05 mem: 47% pow: 639.925 W 0: INFO 26-04-29 17:39:13.934213 - 2:03:54 - step: 20030 acc: 0 loss: 1.5913 grad: 1.50e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.7282 data: 0.0947 lr: 4.46e-05 mem: 47% pow: 577.531 W 0: INFO 26-04-29 17:39:27.792241 - 2:04:08 - step: 20040 acc: 0 loss: 1.6457 grad: 1.50e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5962 data: 0.0758 lr: 4.46e-05 mem: 47% pow: 660.913 W 0: INFO 26-04-29 17:39:41.686183 - 2:04:22 - step: 20050 acc: 0 loss: 1.5771 grad: 1.48e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6608 data: 0.0935 lr: 4.46e-05 mem: 47% pow: 621.837 W 0: INFO 26-04-29 17:39:55.637431 - 2:04:36 - step: 20060 acc: 0 loss: 1.6821 grad: 1.48e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6717 data: 0.0951 lr: 4.46e-05 mem: 47% pow: 612.967 W 0: INFO 26-04-29 17:40:09.437313 - 2:04:50 - step: 20070 acc: 0 loss: 1.6864 grad: 1.43e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6125 data: 0.0875 lr: 4.45e-05 mem: 47% pow: 650.018 W 0: INFO 26-04-29 17:40:23.383175 - 2:05:04 - step: 20080 acc: 0 loss: 1.1443 grad: 1.53e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6243 data: 0.0848 lr: 4.45e-05 mem: 47% pow: 648.304 W 0: INFO 26-04-29 17:40:37.454476 - 2:05:18 - step: 20090 acc: 0 loss: 1.3024 grad: 1.50e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.5782 data: 0.1215 lr: 4.45e-05 mem: 47% pow: 647.131 W 0: INFO 26-04-29 17:40:51.491532 - 2:05:32 - step: 20100 acc: 0 loss: 1.0631 grad: 1.53e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6025 data: 0.0777 lr: 4.45e-05 mem: 47% pow: 663.069 W 0: INFO 26-04-29 17:41:08.251219 - 2:05:49 - step: 20110 acc: 0 loss: 1.4479 grad: 1.43e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.5862 data: 0.0869 lr: 4.45e-05 mem: 54% pow: 661.761 W 0: INFO 26-04-29 17:41:22.244016 - 2:06:03 - step: 20120 acc: 0 loss: 1.4673 grad: 1.47e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.5781 data: 0.0979 lr: 4.45e-05 mem: 47% pow: 667.096 W 0: INFO 26-04-29 17:41:36.361960 - 2:06:17 - step: 20130 acc: 0 loss: 1.3177 grad: 1.45e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5796 data: 0.1084 lr: 4.44e-05 mem: 47% pow: 662.94 W 0: INFO 26-04-29 17:41:50.460698 - 2:06:31 - step: 20140 acc: 0 loss: 1.2628 grad: 1.69e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5913 data: 0.0949 lr: 4.44e-05 mem: 47% pow: 663.095 W 0: INFO 26-04-29 17:42:04.426367 - 2:06:45 - step: 20150 acc: 0 loss: 1.3667 grad: 1.44e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6013 data: 0.0902 lr: 4.44e-05 mem: 47% pow: 657.273 W 0: INFO 26-04-29 17:42:18.453578 - 2:06:59 - step: 20160 acc: 0 loss: 1.1642 grad: 1.55e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6109 data: 0.0826 lr: 4.44e-05 mem: 47% pow: 653.125 W 0: INFO 26-04-29 17:42:32.572628 - 2:07:13 - step: 20170 acc: 0 loss: 1.5127 grad: 1.42e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6577 data: 0.0915 lr: 4.44e-05 mem: 47% pow: 632.378 W 0: INFO 26-04-29 17:42:46.232175 - 2:07:27 - step: 20180 acc: 0 loss: 1.3366 grad: 1.49e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5819 data: 0.0956 lr: 4.44e-05 mem: 47% pow: 662.734 W 0: INFO 26-04-29 17:42:59.967213 - 2:07:40 - step: 20190 acc: 0 loss: 1.5091 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6217 data: 0.0862 lr: 4.44e-05 mem: 47% pow: 656.447 W 0: INFO 26-04-29 17:43:13.773931 - 2:07:54 - step: 20200 acc: 0 loss: 1.2436 grad: 1.60e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6122 data: 0.0902 lr: 4.43e-05 mem: 47% pow: 644.851 W 0: INFO 26-04-29 17:43:30.607213 - 2:08:11 - step: 20210 acc: 0 loss: 1.3212 grad: 1.49e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6197 data: 0.0944 lr: 4.43e-05 mem: 54% pow: 644.43 W 0: INFO 26-04-29 17:43:44.427803 - 2:08:25 - step: 20220 acc: 0 loss: 1.6001 grad: 1.46e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5789 data: 0.0955 lr: 4.43e-05 mem: 47% pow: 676.924 W 0: INFO 26-04-29 17:43:58.169091 - 2:08:38 - step: 20230 acc: 0 loss: 1.1142 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.579 data: 0.1087 lr: 4.43e-05 mem: 47% pow: 656.342 W 0: INFO 26-04-29 17:44:12.224509 - 2:08:53 - step: 20240 acc: 0 loss: 1.0128 grad: 1.47e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.5978 data: 0.0911 lr: 4.43e-05 mem: 47% pow: 666.169 W 0: INFO 26-04-29 17:44:26.324771 - 2:09:07 - step: 20250 acc: 0 loss: 1.4873 grad: 1.53e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.632 data: 0.0766 lr: 4.43e-05 mem: 47% pow: 651.358 W 0: INFO 26-04-29 17:44:40.433455 - 2:09:21 - step: 20260 acc: 0 loss: 1.3067 grad: 2.27e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6061 data: 0.0911 lr: 4.43e-05 mem: 47% pow: 643.874 W 0: INFO 26-04-29 17:44:54.196165 - 2:09:34 - step: 20270 acc: 0 loss: 1.3513 grad: 1.43e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.591 data: 0.0917 lr: 4.42e-05 mem: 47% pow: 659.162 W 0: INFO 26-04-29 17:45:07.860456 - 2:09:48 - step: 20280 acc: 0 loss: 1.5953 grad: 1.47e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5958 data: 0.0888 lr: 4.42e-05 mem: 47% pow: 660.824 W 0: INFO 26-04-29 17:45:21.984112 - 2:10:02 - step: 20290 acc: 0 loss: 1.2058 grad: 1.57e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6138 data: 0.092 lr: 4.42e-05 mem: 47% pow: 647.649 W 0: INFO 26-04-29 17:45:35.655032 - 2:10:16 - step: 20300 acc: 0 loss: 1.537 grad: 1.50e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5924 data: 0.0849 lr: 4.42e-05 mem: 47% pow: 662.851 W 0: INFO 26-04-29 17:45:52.202593 - 2:10:32 - step: 20310 acc: 0 loss: 1.2311 grad: 1.55e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.5973 data: 0.0835 lr: 4.42e-05 mem: 54% pow: 659.083 W 0: INFO 26-04-29 17:46:06.178710 - 2:10:46 - step: 20320 acc: 0 loss: 1.3116 grad: 1.50e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6189 data: 0.0907 lr: 4.42e-05 mem: 47% pow: 647.759 W 0: INFO 26-04-29 17:46:20.397217 - 2:11:01 - step: 20330 acc: 0 loss: 1.3973 grad: 1.50e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6956 data: 0.0038 lr: 4.42e-05 mem: 47% pow: 648.852 W 0: INFO 26-04-29 17:46:34.343247 - 2:11:15 - step: 20340 acc: 0 loss: 1.4886 grad: 1.42e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6227 data: 0.0838 lr: 4.41e-05 mem: 47% pow: 652.328 W 0: INFO 26-04-29 17:46:48.130915 - 2:11:28 - step: 20350 acc: 0 loss: 1.2992 grad: 1.54e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.7083 data: 0.0802 lr: 4.41e-05 mem: 47% pow: 602.46 W 0: INFO 26-04-29 17:47:02.205700 - 2:11:43 - step: 20360 acc: 0 loss: 1.5795 grad: 1.47e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6024 data: 0.0895 lr: 4.41e-05 mem: 47% pow: 656.32 W 0: INFO 26-04-29 17:47:15.793957 - 2:11:56 - step: 20370 acc: 0 loss: 1.5817 grad: 1.47e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6649 data: 0.0607 lr: 4.41e-05 mem: 47% pow: 639.934 W 0: INFO 26-04-29 17:47:29.813660 - 2:12:10 - step: 20380 acc: 0 loss: 1.6268 grad: 1.55e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5977 data: 0.0965 lr: 4.41e-05 mem: 47% pow: 647.646 W 0: INFO 26-04-29 17:47:43.418278 - 2:12:24 - step: 20390 acc: 0 loss: 0.9583 grad: 1.60e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.616 data: 0.0824 lr: 4.41e-05 mem: 47% pow: 647.887 W 0: INFO 26-04-29 17:47:57.324800 - 2:12:38 - step: 20400 acc: 0 loss: 1.4891 grad: 1.40e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6146 data: 0.0891 lr: 4.40e-05 mem: 47% pow: 649.106 W 0: INFO 26-04-29 17:48:14.507862 - 2:12:55 - step: 20410 acc: 0 loss: 1.7773 grad: 1.44e-01 flops: 3.29e+14 wps: 3.82e+04 iter: 0.6262 data: 0.0937 lr: 4.40e-05 mem: 54% pow: 637.281 W 0: INFO 26-04-29 17:48:28.157377 - 2:13:08 - step: 20420 acc: 0 loss: 1.2605 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.579 data: 0.1004 lr: 4.40e-05 mem: 47% pow: 653.085 W 0: INFO 26-04-29 17:48:42.283547 - 2:13:23 - step: 20430 acc: 0 loss: 1.5725 grad: 1.48e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5832 data: 0.1 lr: 4.40e-05 mem: 47% pow: 653.812 W 0: INFO 26-04-29 17:48:56.196982 - 2:13:36 - step: 20440 acc: 0 loss: 1.388 grad: 1.44e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6092 data: 0.1011 lr: 4.40e-05 mem: 47% pow: 666.525 W 0: INFO 26-04-29 17:49:10.357431 - 2:13:51 - step: 20450 acc: 0 loss: 1.4363 grad: 1.50e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6303 data: 0.0898 lr: 4.40e-05 mem: 47% pow: 637.677 W 0: INFO 26-04-29 17:49:24.712065 - 2:14:05 - step: 20460 acc: 0 loss: 1.5054 grad: 1.50e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.5943 data: 0.0946 lr: 4.40e-05 mem: 47% pow: 661.752 W 0: INFO 26-04-29 17:49:38.232641 - 2:14:19 - step: 20470 acc: 0 loss: 1.2783 grad: 1.54e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5828 data: 0.0919 lr: 4.39e-05 mem: 47% pow: 659.896 W 0: INFO 26-04-29 17:49:52.105879 - 2:14:32 - step: 20480 acc: 0 loss: 1.4557 grad: 1.46e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5894 data: 0.0968 lr: 4.39e-05 mem: 47% pow: 667.572 W 0: INFO 26-04-29 17:50:06.210396 - 2:14:47 - step: 20490 acc: 0 loss: 1.7552 grad: 1.50e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6213 data: 0.0878 lr: 4.39e-05 mem: 47% pow: 645.902 W 0: INFO 26-04-29 17:50:19.816905 - 2:15:00 - step: 20500 acc: 0 loss: 1.2403 grad: 1.48e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5981 data: 0.0954 lr: 4.39e-05 mem: 47% pow: 644.774 W 0: INFO 26-04-29 17:50:37.055865 - 2:15:17 - step: 20510 acc: 0 loss: 1.1978 grad: 1.43e-01 flops: 3.28e+14 wps: 3.80e+04 iter: 0.6631 data: 0.0738 lr: 4.39e-05 mem: 54% pow: 631.145 W 0: INFO 26-04-29 17:50:51.025801 - 2:15:31 - step: 20520 acc: 0 loss: 1.6405 grad: 1.45e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6792 data: 0.0993 lr: 4.39e-05 mem: 47% pow: 609.284 W 0: INFO 26-04-29 17:51:04.615228 - 2:15:45 - step: 20530 acc: 0 loss: 1.9709 grad: 1.45e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.602 data: 0.0714 lr: 4.39e-05 mem: 47% pow: 663.805 W 0: INFO 26-04-29 17:51:18.701328 - 2:15:59 - step: 20540 acc: 0 loss: 1.4399 grad: 1.56e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.617 data: 0.0864 lr: 4.38e-05 mem: 47% pow: 654.179 W 0: INFO 26-04-29 17:51:32.517913 - 2:16:13 - step: 20550 acc: 0 loss: 1.4429 grad: 1.82e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.733 data: 0.0957 lr: 4.38e-05 mem: 47% pow: 582.389 W 0: INFO 26-04-29 17:51:46.186290 - 2:16:26 - step: 20560 acc: 0 loss: 1.204 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.614 data: 0.0836 lr: 4.38e-05 mem: 47% pow: 642.815 W 0: INFO 26-04-29 17:52:00.185121 - 2:16:40 - step: 20570 acc: 0 loss: 1.6177 grad: 1.51e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6003 data: 0.0867 lr: 4.38e-05 mem: 47% pow: 660.034 W 0: INFO 26-04-29 17:52:13.961555 - 2:16:54 - step: 20580 acc: 0 loss: 1.4407 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6163 data: 0.0846 lr: 4.38e-05 mem: 47% pow: 646.877 W 0: INFO 26-04-29 17:52:28.234207 - 2:17:09 - step: 20590 acc: 0 loss: 1.4722 grad: 1.43e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.6148 data: 0.0748 lr: 4.38e-05 mem: 47% pow: 657.121 W 0: INFO 26-04-29 17:52:42.039394 - 2:17:22 - step: 20600 acc: 0 loss: 1.2998 grad: 1.63e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.658 data: 0.0818 lr: 4.37e-05 mem: 47% pow: 624.882 W 0: INFO 26-04-29 17:52:58.845281 - 2:17:39 - step: 20610 acc: 0 loss: 1.404 grad: 1.70e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.62 data: 0.0851 lr: 4.37e-05 mem: 54% pow: 651.093 W 0: INFO 26-04-29 17:53:12.705162 - 2:17:53 - step: 20620 acc: 0 loss: 1.2086 grad: 1.51e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6195 data: 0.0927 lr: 4.37e-05 mem: 47% pow: 647.965 W 0: INFO 26-04-29 17:53:26.657580 - 2:18:07 - step: 20630 acc: 0 loss: 1.4123 grad: 1.49e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6056 data: 0.0884 lr: 4.37e-05 mem: 47% pow: 654.983 W 0: INFO 26-04-29 17:53:40.433886 - 2:18:21 - step: 20640 acc: 0 loss: 1.4944 grad: 1.41e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6378 data: 0.0713 lr: 4.37e-05 mem: 47% pow: 652.638 W 0: INFO 26-04-29 17:53:54.585608 - 2:18:35 - step: 20650 acc: 0 loss: 1.5166 grad: 1.43e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.8729 data: 0.0803 lr: 4.37e-05 mem: 47% pow: 510.552 W 0: INFO 26-04-29 17:54:08.471774 - 2:18:49 - step: 20660 acc: 0 loss: 1.2809 grad: 1.44e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5859 data: 0.0858 lr: 4.37e-05 mem: 47% pow: 666.27 W 0: INFO 26-04-29 17:54:22.173463 - 2:19:02 - step: 20670 acc: 0 loss: 1.6885 grad: 1.41e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5938 data: 0.076 lr: 4.36e-05 mem: 47% pow: 669.958 W 0: INFO 26-04-29 17:54:35.817641 - 2:19:16 - step: 20680 acc: 0 loss: 1.2298 grad: 1.46e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6322 data: 0.0893 lr: 4.36e-05 mem: 47% pow: 635.872 W 0: INFO 26-04-29 17:54:49.573673 - 2:19:30 - step: 20690 acc: 0 loss: 1.4846 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6099 data: 0.0842 lr: 4.36e-05 mem: 47% pow: 656.718 W 0: INFO 26-04-29 17:55:03.509831 - 2:19:44 - step: 20700 acc: 0 loss: 1.8059 grad: 1.45e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.5851 data: 0.0986 lr: 4.36e-05 mem: 47% pow: 666.231 W 0: INFO 26-04-29 17:55:20.265061 - 2:20:01 - step: 20710 acc: 0 loss: 1.5025 grad: 1.51e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.586 data: 0.0873 lr: 4.36e-05 mem: 54% pow: 665.539 W 0: INFO 26-04-29 17:55:33.853981 - 2:20:14 - step: 20720 acc: 0 loss: 1.4944 grad: 1.47e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6047 data: 0.0857 lr: 4.36e-05 mem: 47% pow: 667.958 W 0: INFO 26-04-29 17:55:47.886375 - 2:20:28 - step: 20730 acc: 0 loss: 1.4269 grad: 1.44e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.5952 data: 0.0869 lr: 4.36e-05 mem: 47% pow: 655.902 W 0: INFO 26-04-29 17:56:01.670039 - 2:20:42 - step: 20740 acc: 0 loss: 1.3474 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5906 data: 0.0835 lr: 4.35e-05 mem: 47% pow: 664.673 W 0: INFO 26-04-29 17:56:15.359255 - 2:20:56 - step: 20750 acc: 0 loss: 1.5399 grad: 1.55e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5926 data: 0.0856 lr: 4.35e-05 mem: 47% pow: 667.89 W 0: INFO 26-04-29 17:56:29.280851 - 2:21:10 - step: 20760 acc: 0 loss: 1.0444 grad: 1.46e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6264 data: 0.0848 lr: 4.35e-05 mem: 47% pow: 644.035 W 0: INFO 26-04-29 17:56:43.048027 - 2:21:23 - step: 20770 acc: 0 loss: 1.5809 grad: 1.58e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6035 data: 0.0857 lr: 4.35e-05 mem: 47% pow: 665.49 W 0: INFO 26-04-29 17:56:56.931801 - 2:21:37 - step: 20780 acc: 0 loss: 0.9799 grad: 1.50e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6233 data: 0.0763 lr: 4.35e-05 mem: 47% pow: 657.521 W 0: INFO 26-04-29 17:57:10.505765 - 2:21:51 - step: 20790 acc: 0 loss: 1.4401 grad: 1.54e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5918 data: 0.0896 lr: 4.35e-05 mem: 47% pow: 662.268 W 0: INFO 26-04-29 17:57:24.234479 - 2:22:05 - step: 20800 acc: 0 loss: 1.79 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6453 data: 0.0845 lr: 4.35e-05 mem: 47% pow: 641.775 W 0: INFO 26-04-29 17:57:40.804762 - 2:22:21 - step: 20810 acc: 0 loss: 1.4807 grad: 1.42e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6149 data: 0.0869 lr: 4.34e-05 mem: 54% pow: 649.357 W 0: INFO 26-04-29 17:57:54.439299 - 2:22:35 - step: 20820 acc: 0 loss: 1.2925 grad: 1.50e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.633 data: 0.0822 lr: 4.34e-05 mem: 47% pow: 649.639 W 0: INFO 26-04-29 17:58:08.100440 - 2:22:48 - step: 20830 acc: 0 loss: 1.6633 grad: 1.47e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6042 data: 0.088 lr: 4.34e-05 mem: 47% pow: 660.265 W 0: INFO 26-04-29 17:58:21.814469 - 2:23:02 - step: 20840 acc: 0 loss: 1.2371 grad: 1.58e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6115 data: 0.0798 lr: 4.34e-05 mem: 47% pow: 658.609 W 0: INFO 26-04-29 17:58:35.348081 - 2:23:16 - step: 20850 acc: 0 loss: 1.3267 grad: 1.44e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.5901 data: 0.0886 lr: 4.34e-05 mem: 47% pow: 664.243 W 0: INFO 26-04-29 17:58:49.155989 - 2:23:29 - step: 20860 acc: 0 loss: 1.1263 grad: 1.61e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.583 data: 0.0853 lr: 4.34e-05 mem: 47% pow: 676.147 W 0: INFO 26-04-29 17:59:03.295291 - 2:23:44 - step: 20870 acc: 0 loss: 1.4262 grad: 1.45e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.579 data: 0.0871 lr: 4.33e-05 mem: 47% pow: 676.133 W 0: INFO 26-04-29 17:59:17.319581 - 2:23:58 - step: 20880 acc: 0 loss: 1.4592 grad: 1.49e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.602 data: 0.0686 lr: 4.33e-05 mem: 47% pow: 665.009 W 0: INFO 26-04-29 17:59:30.928613 - 2:24:11 - step: 20890 acc: 0 loss: 1.3453 grad: 1.43e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6525 data: 0.0718 lr: 4.33e-05 mem: 47% pow: 634.787 W 0: INFO 26-04-29 17:59:44.856763 - 2:24:25 - step: 20900 acc: 0 loss: 1.456 grad: 1.44e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.607 data: 0.0853 lr: 4.33e-05 mem: 47% pow: 654.355 W 0: INFO 26-04-29 18:00:01.380140 - 2:24:42 - step: 20910 acc: 0 loss: 1.5225 grad: 1.37e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6025 data: 0.0908 lr: 4.33e-05 mem: 54% pow: 644.644 W 0: INFO 26-04-29 18:00:15.376861 - 2:24:56 - step: 20920 acc: 0 loss: 1.5049 grad: 1.56e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6211 data: 0.0691 lr: 4.33e-05 mem: 47% pow: 649.943 W 0: INFO 26-04-29 18:00:29.342624 - 2:25:10 - step: 20930 acc: 0 loss: 1.3873 grad: 1.52e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5843 data: 0.0924 lr: 4.33e-05 mem: 47% pow: 658.724 W 0: INFO 26-04-29 18:00:42.906483 - 2:25:23 - step: 20940 acc: 0 loss: 1.2066 grad: 1.44e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6426 data: 0.0878 lr: 4.32e-05 mem: 47% pow: 632.38 W 0: INFO 26-04-29 18:00:56.863994 - 2:25:37 - step: 20950 acc: 0 loss: 1.3473 grad: 1.56e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6412 data: 0.0883 lr: 4.32e-05 mem: 47% pow: 633.272 W 0: INFO 26-04-29 18:01:10.750401 - 2:25:51 - step: 20960 acc: 0 loss: 1.1569 grad: 1.62e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6076 data: 0.0771 lr: 4.32e-05 mem: 47% pow: 659.643 W 0: INFO 26-04-29 18:01:24.444799 - 2:26:05 - step: 20970 acc: 0 loss: 1.2408 grad: 1.45e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5971 data: 0.0906 lr: 4.32e-05 mem: 47% pow: 666.257 W 0: INFO 26-04-29 18:01:38.283359 - 2:26:19 - step: 20980 acc: 0 loss: 1.5733 grad: 1.42e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5993 data: 0.0783 lr: 4.32e-05 mem: 47% pow: 662.463 W 0: INFO 26-04-29 18:01:52.191821 - 2:26:32 - step: 20990 acc: 0 loss: 1.7606 grad: 1.53e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5821 data: 0.1023 lr: 4.32e-05 mem: 47% pow: 662.917 W 0: INFO 26-04-29 18:02:05.917212 - 2:26:46 - step: 21000 acc: 0 loss: 1.2575 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6266 data: 0.0784 lr: 4.32e-05 mem: 47% pow: 650.858 W 0: INFO 26-04-29 18:02:09.634998 - 2:26:50 - garbage collection 0: INFO 26-04-29 18:02:24.109530 - 2:27:04 - step: 21010 acc: 0 loss: 1.6944 grad: 1.42e-01 flops: 3.10e+14 wps: 3.60e+04 iter: 0.6221 data: 0.071 lr: 4.31e-05 mem: 54% pow: 666.597 W 0: INFO 26-04-29 18:02:37.857917 - 2:27:18 - step: 21020 acc: 0 loss: 1.3453 grad: 1.59e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.589 data: 0.085 lr: 4.31e-05 mem: 47% pow: 667.161 W 0: INFO 26-04-29 18:02:51.584004 - 2:27:32 - step: 21030 acc: 0 loss: 1.1496 grad: 1.44e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6076 data: 0.0824 lr: 4.31e-05 mem: 47% pow: 656.606 W 0: INFO 26-04-29 18:03:05.185077 - 2:27:45 - step: 21040 acc: 0 loss: 1.7765 grad: 1.50e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6235 data: 0.0852 lr: 4.31e-05 mem: 47% pow: 647.756 W 0: INFO 26-04-29 18:03:18.977379 - 2:27:59 - step: 21050 acc: 0 loss: 1.3769 grad: 1.44e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6711 data: 0.079 lr: 4.31e-05 mem: 47% pow: 618.42 W 0: INFO 26-04-29 18:03:32.918895 - 2:28:13 - step: 21060 acc: 0 loss: 1.2236 grad: 1.45e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6145 data: 0.0882 lr: 4.31e-05 mem: 47% pow: 655.384 W 0: INFO 26-04-29 18:03:46.674546 - 2:28:27 - step: 21070 acc: 0 loss: 1.3177 grad: 1.40e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.58 data: 0.1046 lr: 4.30e-05 mem: 47% pow: 667.024 W 0: INFO 26-04-29 18:04:00.190646 - 2:28:40 - step: 21080 acc: 0 loss: 1.088 grad: 1.45e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6069 data: 0.0739 lr: 4.30e-05 mem: 47% pow: 659.569 W 0: INFO 26-04-29 18:04:13.891261 - 2:28:54 - step: 21090 acc: 0 loss: 1.6708 grad: 1.44e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.598 data: 0.0819 lr: 4.30e-05 mem: 47% pow: 669.654 W 0: INFO 26-04-29 18:04:27.609331 - 2:29:08 - step: 21100 acc: 0 loss: 1.4269 grad: 1.47e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5797 data: 0.1145 lr: 4.30e-05 mem: 47% pow: 656.083 W 0: INFO 26-04-29 18:04:44.292452 - 2:29:25 - step: 21110 acc: 0 loss: 1.5689 grad: 1.48e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6335 data: 0.092 lr: 4.30e-05 mem: 54% pow: 637.963 W 0: INFO 26-04-29 18:04:58.155458 - 2:29:38 - step: 21120 acc: 0 loss: 1.6989 grad: 1.49e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.602 data: 0.083 lr: 4.30e-05 mem: 47% pow: 673.257 W 0: INFO 26-04-29 18:05:11.929776 - 2:29:52 - step: 21130 acc: 0 loss: 1.1104 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6173 data: 0.0558 lr: 4.30e-05 mem: 47% pow: 668.534 W 0: INFO 26-04-29 18:05:25.729988 - 2:30:06 - step: 21140 acc: 0 loss: 1.1154 grad: 1.49e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6095 data: 0.0896 lr: 4.29e-05 mem: 47% pow: 643.207 W 0: INFO 26-04-29 18:05:39.576962 - 2:30:20 - step: 21150 acc: 0 loss: 1.5273 grad: 1.44e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5813 data: 0.093 lr: 4.29e-05 mem: 47% pow: 669.211 W 0: INFO 26-04-29 18:05:53.378144 - 2:30:34 - step: 21160 acc: 0 loss: 1.0692 grad: 1.45e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5826 data: 0.1254 lr: 4.29e-05 mem: 47% pow: 648.61 W 0: INFO 26-04-29 18:06:07.019749 - 2:30:47 - step: 21170 acc: 0 loss: 1.5757 grad: 1.44e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5931 data: 0.09 lr: 4.29e-05 mem: 47% pow: 675.099 W 0: INFO 26-04-29 18:06:21.352183 - 2:31:02 - step: 21180 acc: 0 loss: 1.3944 grad: 1.57e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.5907 data: 0.0873 lr: 4.29e-05 mem: 47% pow: 662.584 W 0: INFO 26-04-29 18:06:35.057733 - 2:31:15 - step: 21190 acc: 0 loss: 1.249 grad: 1.51e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5943 data: 0.0858 lr: 4.29e-05 mem: 47% pow: 656.852 W 0: INFO 26-04-29 18:06:48.770502 - 2:31:29 - step: 21200 acc: 0 loss: 1.3772 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5971 data: 0.0821 lr: 4.29e-05 mem: 47% pow: 663.698 W 0: INFO 26-04-29 18:07:05.230957 - 2:31:46 - step: 21210 acc: 0 loss: 1.1576 grad: 1.40e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5879 data: 0.0886 lr: 4.28e-05 mem: 54% pow: 662.527 W 0: INFO 26-04-29 18:07:18.897492 - 2:31:59 - step: 21220 acc: 0 loss: 1.0851 grad: 1.51e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.7304 data: 0.0861 lr: 4.28e-05 mem: 47% pow: 585.131 W 0: INFO 26-04-29 18:07:32.729582 - 2:32:13 - step: 21230 acc: 0 loss: 1.2681 grad: 1.51e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.612 data: 0.0878 lr: 4.28e-05 mem: 47% pow: 644.176 W 0: INFO 26-04-29 18:07:46.308006 - 2:32:27 - step: 21240 acc: 0 loss: 1.3324 grad: 1.49e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5908 data: 0.0842 lr: 4.28e-05 mem: 47% pow: 675.805 W 0: INFO 26-04-29 18:08:00.130392 - 2:32:40 - step: 21250 acc: 0 loss: 1.4938 grad: 1.50e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6154 data: 0.086 lr: 4.28e-05 mem: 47% pow: 642.474 W 0: INFO 26-04-29 18:08:13.898275 - 2:32:54 - step: 21260 acc: 0 loss: 1.297 grad: 1.43e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6623 data: 0.0859 lr: 4.28e-05 mem: 47% pow: 623.472 W 0: INFO 26-04-29 18:08:27.588666 - 2:33:08 - step: 21270 acc: 0 loss: 1.4792 grad: 1.48e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6014 data: 0.0863 lr: 4.28e-05 mem: 47% pow: 671.889 W 0: INFO 26-04-29 18:08:41.413660 - 2:33:22 - step: 21280 acc: 0 loss: 1.2599 grad: 1.50e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6149 data: 0.0805 lr: 4.27e-05 mem: 47% pow: 660.702 W 0: INFO 26-04-29 18:08:55.053222 - 2:33:35 - step: 21290 acc: 0 loss: 1.4837 grad: 1.34e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6474 data: 0.0666 lr: 4.27e-05 mem: 47% pow: 639.435 W 0: INFO 26-04-29 18:09:08.606217 - 2:33:49 - step: 21300 acc: 0 loss: 1.3945 grad: 1.47e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.598 data: 0.0882 lr: 4.27e-05 mem: 47% pow: 676.774 W 0: INFO 26-04-29 18:09:25.425255 - 2:34:06 - step: 21310 acc: 0 loss: 1.4611 grad: 1.49e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6057 data: 0.0805 lr: 4.27e-05 mem: 54% pow: 659.684 W 0: INFO 26-04-29 18:09:39.312397 - 2:34:20 - step: 21320 acc: 0 loss: 1.4981 grad: 1.45e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5908 data: 0.0905 lr: 4.27e-05 mem: 47% pow: 659.318 W 0: INFO 26-04-29 18:09:52.833978 - 2:34:33 - step: 21330 acc: 0 loss: 1.6767 grad: 1.39e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5938 data: 0.0861 lr: 4.27e-05 mem: 47% pow: 662.6 W 0: INFO 26-04-29 18:10:06.510322 - 2:34:47 - step: 21340 acc: 0 loss: 1.044 grad: 1.39e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6037 data: 0.0763 lr: 4.26e-05 mem: 47% pow: 665.101 W 0: INFO 26-04-29 18:10:20.236284 - 2:35:01 - step: 21350 acc: 0 loss: 1.292 grad: 1.61e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.674 data: 0.0888 lr: 4.26e-05 mem: 47% pow: 606.2 W 0: INFO 26-04-29 18:10:33.923232 - 2:35:14 - step: 21360 acc: 0 loss: 1.259 grad: 1.49e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5997 data: 0.074 lr: 4.26e-05 mem: 47% pow: 669.88 W 0: INFO 26-04-29 18:10:47.429526 - 2:35:28 - step: 21370 acc: 0 loss: 1.6242 grad: 1.41e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5829 data: 0.0901 lr: 4.26e-05 mem: 47% pow: 678.434 W 0: INFO 26-04-29 18:11:01.644503 - 2:35:42 - step: 21380 acc: 0 loss: 1.6535 grad: 1.43e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.5953 data: 0.0867 lr: 4.26e-05 mem: 47% pow: 658.596 W 0: INFO 26-04-29 18:11:15.308237 - 2:35:56 - step: 21390 acc: 0 loss: 1.2523 grad: 1.47e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6174 data: 0.0756 lr: 4.26e-05 mem: 47% pow: 648.708 W 0: INFO 26-04-29 18:11:28.909408 - 2:36:09 - step: 21400 acc: 0 loss: 1.5344 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6252 data: 0.0843 lr: 4.26e-05 mem: 47% pow: 639.857 W 0: INFO 26-04-29 18:11:45.640352 - 2:36:26 - step: 21410 acc: 0 loss: 1.34 grad: 1.47e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.5978 data: 0.0894 lr: 4.25e-05 mem: 54% pow: 663.997 W 0: INFO 26-04-29 18:11:59.365167 - 2:36:40 - step: 21420 acc: 0 loss: 1.328 grad: 1.41e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6087 data: 0.0805 lr: 4.25e-05 mem: 47% pow: 663.089 W 0: INFO 26-04-29 18:12:12.981526 - 2:36:53 - step: 21430 acc: 0 loss: 1.4028 grad: 1.39e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5976 data: 0.088 lr: 4.25e-05 mem: 47% pow: 651.947 W 0: INFO 26-04-29 18:12:26.715449 - 2:37:07 - step: 21440 acc: 0 loss: 1.3923 grad: 1.43e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5962 data: 0.0864 lr: 4.25e-05 mem: 47% pow: 657.941 W 0: INFO 26-04-29 18:12:40.350196 - 2:37:21 - step: 21450 acc: 0 loss: 1.5317 grad: 1.43e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6088 data: 0.0807 lr: 4.25e-05 mem: 47% pow: 658.936 W 0: INFO 26-04-29 18:12:54.099822 - 2:37:34 - step: 21460 acc: 0 loss: 1.4075 grad: 1.45e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.716 data: 0.0845 lr: 4.25e-05 mem: 47% pow: 586.607 W 0: INFO 26-04-29 18:13:07.538639 - 2:37:48 - step: 21470 acc: 0 loss: 1.2651 grad: 1.54e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5996 data: 0.0865 lr: 4.25e-05 mem: 47% pow: 661.582 W 0: INFO 26-04-29 18:13:21.113659 - 2:38:01 - step: 21480 acc: 0 loss: 1.2184 grad: 1.42e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6041 data: 0.0928 lr: 4.24e-05 mem: 47% pow: 654.96 W 0: INFO 26-04-29 18:13:34.865223 - 2:38:15 - step: 21490 acc: 0 loss: 1.4771 grad: 1.43e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6969 data: 0.0801 lr: 4.24e-05 mem: 47% pow: 611.262 W 0: INFO 26-04-29 18:13:48.430017 - 2:38:29 - step: 21500 acc: 0 loss: 1.6095 grad: 1.39e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6068 data: 0.0867 lr: 4.24e-05 mem: 47% pow: 655.438 W 0: INFO 26-04-29 18:14:05.293039 - 2:38:46 - step: 21510 acc: 0 loss: 1.2431 grad: 1.65e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6135 data: 0.0771 lr: 4.24e-05 mem: 54% pow: 653.059 W 0: INFO 26-04-29 18:14:18.893748 - 2:38:59 - step: 21520 acc: 0 loss: 1.2098 grad: 1.51e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6176 data: 0.0765 lr: 4.24e-05 mem: 47% pow: 657.989 W 0: INFO 26-04-29 18:14:32.289363 - 2:39:13 - step: 21530 acc: 0 loss: 1.361 grad: 1.49e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.5842 data: 0.0912 lr: 4.24e-05 mem: 47% pow: 660.827 W 0: INFO 26-04-29 18:14:46.026064 - 2:39:26 - step: 21540 acc: 0 loss: 1.3208 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6819 data: 0.0033 lr: 4.23e-05 mem: 47% pow: 666.992 W 0: INFO 26-04-29 18:14:59.740906 - 2:39:40 - step: 21550 acc: 0 loss: 1.2861 grad: 1.45e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5822 data: 0.0915 lr: 4.23e-05 mem: 47% pow: 663.748 W 0: INFO 26-04-29 18:15:13.439827 - 2:39:54 - step: 21560 acc: 0 loss: 1.4204 grad: 1.47e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5959 data: 0.09 lr: 4.23e-05 mem: 47% pow: 658.047 W 0: INFO 26-04-29 18:15:27.003611 - 2:40:07 - step: 21570 acc: 0 loss: 1.4089 grad: 1.43e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5817 data: 0.0994 lr: 4.23e-05 mem: 47% pow: 665.17 W 0: INFO 26-04-29 18:15:40.819633 - 2:40:21 - step: 21580 acc: 0 loss: 1.4429 grad: 1.57e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6547 data: 0.0804 lr: 4.23e-05 mem: 47% pow: 630.901 W 0: INFO 26-04-29 18:15:54.311698 - 2:40:35 - step: 21590 acc: 0 loss: 1.463 grad: 1.48e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5959 data: 0.0938 lr: 4.23e-05 mem: 47% pow: 662.563 W 0: INFO 26-04-29 18:16:07.944263 - 2:40:48 - step: 21600 acc: 0 loss: 1.2375 grad: 1.49e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6228 data: 0.0803 lr: 4.23e-05 mem: 47% pow: 646.869 W 0: INFO 26-04-29 18:16:24.606830 - 2:41:05 - step: 21610 acc: 0 loss: 1.7638 grad: 1.46e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6018 data: 0.0898 lr: 4.22e-05 mem: 54% pow: 659.239 W 0: INFO 26-04-29 18:16:38.257099 - 2:41:19 - step: 21620 acc: 0 loss: 1.3158 grad: 1.52e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5858 data: 0.0957 lr: 4.22e-05 mem: 47% pow: 664.217 W 0: INFO 26-04-29 18:16:52.110431 - 2:41:32 - step: 21630 acc: 0 loss: 1.2645 grad: 1.53e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5969 data: 0.092 lr: 4.22e-05 mem: 47% pow: 650.201 W 0: INFO 26-04-29 18:17:05.637532 - 2:41:46 - step: 21640 acc: 0 loss: 1.8669 grad: 1.59e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.5936 data: 0.0966 lr: 4.22e-05 mem: 47% pow: 654.251 W 0: INFO 26-04-29 18:17:19.222725 - 2:42:00 - step: 21650 acc: 0 loss: 1.6085 grad: 1.49e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5976 data: 0.09 lr: 4.22e-05 mem: 47% pow: 667.347 W 0: INFO 26-04-29 18:17:32.854421 - 2:42:13 - step: 21660 acc: 0 loss: 1.8112 grad: 1.51e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6795 data: 0.0036 lr: 4.22e-05 mem: 47% pow: 663.201 W 0: INFO 26-04-29 18:17:46.339691 - 2:42:27 - step: 21670 acc: 0 loss: 1.3778 grad: 1.48e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6106 data: 0.0869 lr: 4.22e-05 mem: 47% pow: 645.45 W 0: INFO 26-04-29 18:18:00.008574 - 2:42:40 - step: 21680 acc: 0 loss: 1.5046 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5934 data: 0.0883 lr: 4.21e-05 mem: 47% pow: 660.552 W 0: INFO 26-04-29 18:18:13.548552 - 2:42:54 - step: 21690 acc: 0 loss: 1.3734 grad: 1.54e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.598 data: 0.0899 lr: 4.21e-05 mem: 47% pow: 658.672 W 0: INFO 26-04-29 18:18:27.360720 - 2:43:08 - step: 21700 acc: 0 loss: 1.2831 grad: 1.58e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5926 data: 0.0905 lr: 4.21e-05 mem: 47% pow: 664.586 W 0: INFO 26-04-29 18:18:43.960727 - 2:43:24 - step: 21710 acc: 0 loss: 1.2749 grad: 1.46e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.5935 data: 0.0874 lr: 4.21e-05 mem: 54% pow: 658.788 W 0: INFO 26-04-29 18:18:57.656624 - 2:43:38 - step: 21720 acc: 0 loss: 1.2664 grad: 1.50e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6276 data: 0.0858 lr: 4.21e-05 mem: 47% pow: 642.174 W 0: INFO 26-04-29 18:19:11.378070 - 2:43:52 - step: 21730 acc: 0 loss: 1.6942 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6013 data: 0.0894 lr: 4.21e-05 mem: 47% pow: 656.106 W 0: INFO 26-04-29 18:19:25.088632 - 2:44:05 - step: 21740 acc: 0 loss: 1.3257 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5972 data: 0.0943 lr: 4.21e-05 mem: 47% pow: 653.998 W 0: INFO 26-04-29 18:19:38.550194 - 2:44:19 - step: 21750 acc: 0 loss: 1.3784 grad: 1.52e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5914 data: 0.0969 lr: 4.20e-05 mem: 47% pow: 656.867 W 0: INFO 26-04-29 18:19:52.096207 - 2:44:32 - step: 21760 acc: 0 loss: 1.1056 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5857 data: 0.1039 lr: 4.20e-05 mem: 47% pow: 656.134 W 0: INFO 26-04-29 18:20:06.178272 - 2:44:46 - step: 21770 acc: 0 loss: 1.0302 grad: 1.85e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5851 data: 0.0953 lr: 4.20e-05 mem: 47% pow: 656.452 W 0: INFO 26-04-29 18:20:19.792768 - 2:45:00 - step: 21780 acc: 0 loss: 1.2545 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5864 data: 0.098 lr: 4.20e-05 mem: 47% pow: 660.0 W 0: INFO 26-04-29 18:20:33.343915 - 2:45:14 - step: 21790 acc: 0 loss: 1.543 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5861 data: 0.097 lr: 4.20e-05 mem: 47% pow: 663.012 W 0: INFO 26-04-29 18:20:47.017913 - 2:45:27 - step: 21800 acc: 0 loss: 1.6732 grad: 1.47e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6481 data: 0.1038 lr: 4.20e-05 mem: 47% pow: 615.964 W 0: INFO 26-04-29 18:21:03.624289 - 2:45:44 - step: 21810 acc: 0 loss: 1.3994 grad: 1.44e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.5912 data: 0.0899 lr: 4.19e-05 mem: 54% pow: 654.263 W 0: INFO 26-04-29 18:21:17.305185 - 2:45:58 - step: 21820 acc: 0 loss: 1.0262 grad: 1.49e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.672 data: 0.1014 lr: 4.19e-05 mem: 47% pow: 614.29 W 0: INFO 26-04-29 18:21:31.027844 - 2:46:11 - step: 21830 acc: 0 loss: 1.7172 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5874 data: 0.0921 lr: 4.19e-05 mem: 47% pow: 684.282 W 0: INFO 26-04-29 18:21:44.732042 - 2:46:25 - step: 21840 acc: 0 loss: 1.5091 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6385 data: 0.0889 lr: 4.19e-05 mem: 47% pow: 640.609 W 0: INFO 26-04-29 18:21:58.328817 - 2:46:39 - step: 21850 acc: 0 loss: 1.5602 grad: 1.56e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6293 data: 0.087 lr: 4.19e-05 mem: 47% pow: 652.879 W 0: INFO 26-04-29 18:22:11.751668 - 2:46:52 - step: 21860 acc: 0 loss: 1.3579 grad: 1.48e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5951 data: 0.0963 lr: 4.19e-05 mem: 47% pow: 658.451 W 0: INFO 26-04-29 18:22:25.419756 - 2:47:06 - step: 21870 acc: 0 loss: 1.165 grad: 1.48e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6247 data: 0.0694 lr: 4.19e-05 mem: 47% pow: 655.693 W 0: INFO 26-04-29 18:22:38.940418 - 2:47:19 - step: 21880 acc: 0 loss: 1.3944 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6692 data: 0.0527 lr: 4.18e-05 mem: 47% pow: 628.907 W 0: INFO 26-04-29 18:22:52.841104 - 2:47:33 - step: 21890 acc: 0 loss: 1.3456 grad: 1.57e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.716 data: 0.0861 lr: 4.18e-05 mem: 47% pow: 588.236 W 0: INFO 26-04-29 18:23:06.531181 - 2:47:47 - step: 21900 acc: 0 loss: 1.3288 grad: 1.43e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5932 data: 0.0951 lr: 4.18e-05 mem: 47% pow: 669.298 W 0: INFO 26-04-29 18:23:23.193838 - 2:48:03 - step: 21910 acc: 0 loss: 1.3879 grad: 1.40e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6089 data: 0.1159 lr: 4.18e-05 mem: 54% pow: 631.727 W 0: INFO 26-04-29 18:23:37.008366 - 2:48:17 - step: 21920 acc: 0 loss: 1.5291 grad: 1.62e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.608 data: 0.0808 lr: 4.18e-05 mem: 47% pow: 660.701 W 0: INFO 26-04-29 18:23:50.514989 - 2:48:31 - step: 21930 acc: 0 loss: 1.1148 grad: 1.49e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5891 data: 0.0841 lr: 4.18e-05 mem: 47% pow: 672.994 W 0: INFO 26-04-29 18:24:04.513276 - 2:48:45 - step: 21940 acc: 0 loss: 1.222 grad: 1.52e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6047 data: 0.0944 lr: 4.18e-05 mem: 47% pow: 663.561 W 0: INFO 26-04-29 18:24:18.363919 - 2:48:59 - step: 21950 acc: 0 loss: 1.2772 grad: 1.49e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5937 data: 0.0912 lr: 4.17e-05 mem: 47% pow: 663.851 W 0: INFO 26-04-29 18:24:31.905600 - 2:49:12 - step: 21960 acc: 0 loss: 1.4345 grad: 1.56e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.5776 data: 0.115 lr: 4.17e-05 mem: 47% pow: 659.886 W 0: INFO 26-04-29 18:24:45.553698 - 2:49:26 - step: 21970 acc: 0 loss: 1.5377 grad: 1.47e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5968 data: 0.0952 lr: 4.17e-05 mem: 47% pow: 648.829 W 0: INFO 26-04-29 18:24:59.322842 - 2:49:40 - step: 21980 acc: 0 loss: 1.5854 grad: 1.44e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6002 data: 0.0831 lr: 4.17e-05 mem: 47% pow: 659.605 W 0: INFO 26-04-29 18:25:12.766802 - 2:49:53 - step: 21990 acc: 0 loss: 1.4848 grad: 1.45e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6389 data: 0.0852 lr: 4.17e-05 mem: 47% pow: 644.491 W 0: INFO 26-04-29 18:25:26.252540 - 2:50:07 - step: 22000 acc: 0 loss: 1.7586 grad: 1.81e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6226 data: 0.083 lr: 4.17e-05 mem: 47% pow: 641.337 W 0: INFO 26-04-29 18:25:29.963395 - 2:50:10 - garbage collection 0: INFO 26-04-29 18:25:44.293424 - 2:50:25 - step: 22010 acc: 0 loss: 1.6094 grad: 1.48e-01 flops: 3.13e+14 wps: 3.63e+04 iter: 0.58 data: 0.0931 lr: 4.17e-05 mem: 54% pow: 672.072 W 0: INFO 26-04-29 18:25:58.099284 - 2:50:38 - step: 22020 acc: 0 loss: 1.4578 grad: 1.55e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5969 data: 0.0924 lr: 4.16e-05 mem: 47% pow: 677.215 W 0: INFO 26-04-29 18:26:11.901748 - 2:50:52 - step: 22030 acc: 0 loss: 1.4282 grad: 1.46e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6007 data: 0.0924 lr: 4.16e-05 mem: 47% pow: 651.67 W 0: INFO 26-04-29 18:26:25.606626 - 2:51:06 - step: 22040 acc: 0 loss: 1.0656 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6812 data: 0.0033 lr: 4.16e-05 mem: 47% pow: 664.76 W 0: INFO 26-04-29 18:26:39.114018 - 2:51:19 - step: 22050 acc: 0 loss: 1.8738 grad: 1.62e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5865 data: 0.0935 lr: 4.16e-05 mem: 47% pow: 659.18 W 0: INFO 26-04-29 18:26:52.504165 - 2:51:33 - step: 22060 acc: 0 loss: 1.1244 grad: 1.51e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.6034 data: 0.0786 lr: 4.16e-05 mem: 47% pow: 655.858 W 0: INFO 26-04-29 18:27:06.054550 - 2:51:46 - step: 22070 acc: 0 loss: 1.3567 grad: 1.43e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.624 data: 0.0875 lr: 4.16e-05 mem: 47% pow: 650.122 W 0: INFO 26-04-29 18:27:19.741994 - 2:52:00 - step: 22080 acc: 0 loss: 1.4522 grad: 1.43e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6265 data: 0.0868 lr: 4.15e-05 mem: 47% pow: 639.82 W 0: INFO 26-04-29 18:27:33.462363 - 2:52:14 - step: 22090 acc: 0 loss: 1.4326 grad: 1.40e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7411 data: 0.0908 lr: 4.15e-05 mem: 47% pow: 579.859 W 0: INFO 26-04-29 18:27:47.406072 - 2:52:28 - step: 22100 acc: 0 loss: 1.3991 grad: 1.58e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6005 data: 0.0808 lr: 4.15e-05 mem: 47% pow: 659.27 W 0: INFO 26-04-29 18:28:04.070820 - 2:52:44 - step: 22110 acc: 0 loss: 1.1061 grad: 1.50e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5986 data: 0.0856 lr: 4.15e-05 mem: 54% pow: 662.302 W 0: INFO 26-04-29 18:28:17.514582 - 2:52:58 - step: 22120 acc: 0 loss: 1.3392 grad: 1.45e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5919 data: 0.09 lr: 4.15e-05 mem: 47% pow: 665.312 W 0: INFO 26-04-29 18:28:31.052732 - 2:53:11 - step: 22130 acc: 0 loss: 1.3372 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5816 data: 0.0882 lr: 4.15e-05 mem: 47% pow: 669.42 W 0: INFO 26-04-29 18:28:44.727943 - 2:53:25 - step: 22140 acc: 0 loss: 1.3978 grad: 1.53e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5903 data: 0.0892 lr: 4.15e-05 mem: 47% pow: 655.665 W 0: INFO 26-04-29 18:28:58.334181 - 2:53:39 - step: 22150 acc: 0 loss: 1.3744 grad: 1.50e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5909 data: 0.0953 lr: 4.14e-05 mem: 47% pow: 670.801 W 0: INFO 26-04-29 18:29:12.030175 - 2:53:52 - step: 22160 acc: 0 loss: 1.4353 grad: 1.49e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6044 data: 0.0787 lr: 4.14e-05 mem: 47% pow: 667.136 W 0: INFO 26-04-29 18:29:26.042371 - 2:54:06 - step: 22170 acc: 0 loss: 1.9712 grad: 1.52e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.592 data: 0.0823 lr: 4.14e-05 mem: 47% pow: 664.86 W 0: INFO 26-04-29 18:29:39.425319 - 2:54:20 - step: 22180 acc: 0 loss: 1.0763 grad: 1.45e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5929 data: 0.0848 lr: 4.14e-05 mem: 47% pow: 659.326 W 0: INFO 26-04-29 18:29:52.933210 - 2:54:33 - step: 22190 acc: 0 loss: 1.1598 grad: 1.45e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5955 data: 0.0846 lr: 4.14e-05 mem: 47% pow: 663.95 W 0: INFO 26-04-29 18:30:06.338141 - 2:54:47 - step: 22200 acc: 0 loss: 0.9901 grad: 1.46e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.5957 data: 0.0911 lr: 4.14e-05 mem: 47% pow: 666.799 W 0: INFO 26-04-29 18:30:22.730597 - 2:55:03 - step: 22210 acc: 0 loss: 1.346 grad: 1.53e-01 flops: 3.45e+14 wps: 4.00e+04 iter: 0.6155 data: 0.0873 lr: 4.14e-05 mem: 54% pow: 651.329 W 0: INFO 26-04-29 18:30:36.209648 - 2:55:17 - step: 22220 acc: 0 loss: 1.2973 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6339 data: 0.0913 lr: 4.13e-05 mem: 47% pow: 631.398 W 0: INFO 26-04-29 18:30:50.009706 - 2:55:30 - step: 22230 acc: 0 loss: 1.3206 grad: 1.52e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5918 data: 0.0889 lr: 4.13e-05 mem: 47% pow: 662.733 W 0: INFO 26-04-29 18:31:03.565645 - 2:55:44 - step: 22240 acc: 0 loss: 1.3295 grad: 1.45e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5864 data: 0.0869 lr: 4.13e-05 mem: 47% pow: 666.383 W 0: INFO 26-04-29 18:31:17.381597 - 2:55:58 - step: 22250 acc: 0 loss: 1.3705 grad: 1.47e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5975 data: 0.0996 lr: 4.13e-05 mem: 47% pow: 647.647 W 0: INFO 26-04-29 18:31:30.934212 - 2:56:11 - step: 22260 acc: 0 loss: 1.3101 grad: 1.57e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6094 data: 0.0745 lr: 4.13e-05 mem: 47% pow: 656.363 W 0: INFO 26-04-29 18:31:44.584357 - 2:56:25 - step: 22270 acc: 0 loss: 1.223 grad: 1.68e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6223 data: 0.0682 lr: 4.13e-05 mem: 47% pow: 653.723 W 0: INFO 26-04-29 18:31:58.267796 - 2:56:39 - step: 22280 acc: 0 loss: 1.6488 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6209 data: 0.0812 lr: 4.12e-05 mem: 47% pow: 642.402 W 0: INFO 26-04-29 18:32:11.724158 - 2:56:52 - step: 22290 acc: 0 loss: 1.2397 grad: 1.51e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5936 data: 0.0777 lr: 4.12e-05 mem: 47% pow: 673.064 W 0: INFO 26-04-29 18:32:25.381337 - 2:57:06 - step: 22300 acc: 0 loss: 1.6089 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.7269 data: 0.0843 lr: 4.12e-05 mem: 47% pow: 594.47 W 0: INFO 26-04-29 18:32:41.809821 - 2:57:22 - step: 22310 acc: 0 loss: 1.4851 grad: 1.46e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.585 data: 0.0914 lr: 4.12e-05 mem: 54% pow: 668.897 W 0: INFO 26-04-29 18:32:55.297375 - 2:57:36 - step: 22320 acc: 0 loss: 1.5067 grad: 1.46e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6507 data: 0.0711 lr: 4.12e-05 mem: 47% pow: 642.046 W 0: INFO 26-04-29 18:33:08.994115 - 2:57:49 - step: 22330 acc: 0 loss: 1.402 grad: 1.43e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6034 data: 0.0821 lr: 4.12e-05 mem: 47% pow: 660.423 W 0: INFO 26-04-29 18:33:22.578797 - 2:58:03 - step: 22340 acc: 0 loss: 1.4034 grad: 1.66e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5887 data: 0.0837 lr: 4.12e-05 mem: 47% pow: 665.027 W 0: INFO 26-04-29 18:33:36.054195 - 2:58:16 - step: 22350 acc: 0 loss: 1.5217 grad: 1.49e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.591 data: 0.1128 lr: 4.11e-05 mem: 47% pow: 645.85 W 0: INFO 26-04-29 18:33:49.697970 - 2:58:30 - step: 22360 acc: 0 loss: 1.4817 grad: 1.52e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5808 data: 0.1988 lr: 4.11e-05 mem: 47% pow: 593.012 W 0: INFO 26-04-29 18:34:03.251663 - 2:58:44 - step: 22370 acc: 0 loss: 1.5066 grad: 1.43e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5837 data: 0.0839 lr: 4.11e-05 mem: 47% pow: 675.948 W 0: INFO 26-04-29 18:34:16.735107 - 2:58:57 - step: 22380 acc: 0 loss: 1.6299 grad: 1.55e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6047 data: 0.0942 lr: 4.11e-05 mem: 47% pow: 644.048 W 0: INFO 26-04-29 18:34:30.400464 - 2:59:11 - step: 22390 acc: 0 loss: 1.4022 grad: 1.47e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5897 data: 0.0827 lr: 4.11e-05 mem: 47% pow: 677.731 W 0: INFO 26-04-29 18:34:44.294728 - 2:59:25 - step: 22400 acc: 0 loss: 1.1493 grad: 1.52e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6009 data: 0.0828 lr: 4.11e-05 mem: 47% pow: 670.415 W 0: INFO 26-04-29 18:35:01.321329 - 2:59:42 - step: 22410 acc: 0 loss: 1.4234 grad: 1.44e-01 flops: 3.32e+14 wps: 3.85e+04 iter: 0.646 data: 0.0829 lr: 4.11e-05 mem: 54% pow: 657.931 W 0: INFO 26-04-29 18:35:14.836901 - 2:59:55 - step: 22420 acc: 0 loss: 1.1707 grad: 1.43e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5786 data: 0.1143 lr: 4.10e-05 mem: 47% pow: 655.081 W 0: INFO 26-04-29 18:35:28.245709 - 3:00:09 - step: 22430 acc: 0 loss: 1.218 grad: 1.46e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6051 data: 0.0771 lr: 4.10e-05 mem: 47% pow: 656.854 W 0: INFO 26-04-29 18:35:41.879553 - 3:00:22 - step: 22440 acc: 0 loss: 1.2472 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6128 data: 0.0843 lr: 4.10e-05 mem: 47% pow: 646.033 W 0: INFO 26-04-29 18:35:55.329578 - 3:00:36 - step: 22450 acc: 0 loss: 1.2804 grad: 1.56e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5955 data: 0.0873 lr: 4.10e-05 mem: 47% pow: 661.956 W 0: INFO 26-04-29 18:36:08.704185 - 3:00:49 - step: 22460 acc: 0 loss: 1.5121 grad: 1.64e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5939 data: 0.0895 lr: 4.10e-05 mem: 47% pow: 664.414 W 0: INFO 26-04-29 18:36:22.165647 - 3:01:02 - step: 22470 acc: 0 loss: 1.2108 grad: 1.49e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5805 data: 0.0982 lr: 4.10e-05 mem: 47% pow: 655.752 W 0: INFO 26-04-29 18:36:35.625059 - 3:01:16 - step: 22480 acc: 0 loss: 1.3085 grad: 1.54e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5947 data: 0.0847 lr: 4.10e-05 mem: 47% pow: 660.498 W 0: INFO 26-04-29 18:36:49.103414 - 3:01:29 - step: 22490 acc: 0 loss: 1.1841 grad: 1.49e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5923 data: 0.0917 lr: 4.09e-05 mem: 47% pow: 660.016 W 0: INFO 26-04-29 18:37:02.620416 - 3:01:43 - step: 22500 acc: 0 loss: 1.5169 grad: 1.50e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.61 data: 0.0704 lr: 4.09e-05 mem: 47% pow: 660.16 W 0: INFO 26-04-29 18:37:19.458916 - 3:02:00 - step: 22510 acc: 0 loss: 1.4531 grad: 1.58e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.634 data: 0.0873 lr: 4.09e-05 mem: 54% pow: 634.643 W 0: INFO 26-04-29 18:37:32.910447 - 3:02:13 - step: 22520 acc: 0 loss: 1.363 grad: 1.57e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6024 data: 0.0883 lr: 4.09e-05 mem: 47% pow: 660.489 W 0: INFO 26-04-29 18:37:46.781418 - 3:02:27 - step: 22530 acc: 0 loss: 1.3416 grad: 1.50e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5917 data: 0.0871 lr: 4.09e-05 mem: 47% pow: 653.319 W 0: INFO 26-04-29 18:38:00.200901 - 3:02:40 - step: 22540 acc: 0 loss: 1.5179 grad: 1.54e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6027 data: 0.0876 lr: 4.09e-05 mem: 47% pow: 653.917 W 0: INFO 26-04-29 18:38:13.921195 - 3:02:54 - step: 22550 acc: 0 loss: 1.2809 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5971 data: 0.0868 lr: 4.08e-05 mem: 47% pow: 662.412 W 0: INFO 26-04-29 18:38:27.462127 - 3:03:08 - step: 22560 acc: 0 loss: 1.4964 grad: 1.48e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5774 data: 0.0848 lr: 4.08e-05 mem: 47% pow: 671.617 W 0: INFO 26-04-29 18:38:41.043236 - 3:03:21 - step: 22570 acc: 0 loss: 1.7762 grad: 1.48e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6201 data: 0.0941 lr: 4.08e-05 mem: 47% pow: 644.037 W 0: INFO 26-04-29 18:38:55.091659 - 3:03:35 - step: 22580 acc: 0 loss: 1.2125 grad: 1.51e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6112 data: 0.0837 lr: 4.08e-05 mem: 47% pow: 646.407 W 0: INFO 26-04-29 18:39:08.811365 - 3:03:49 - step: 22590 acc: 0 loss: 1.4707 grad: 1.44e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6689 data: 0.0629 lr: 4.08e-05 mem: 47% pow: 631.232 W 0: INFO 26-04-29 18:39:22.503913 - 3:04:03 - step: 22600 acc: 0 loss: 1.5397 grad: 1.44e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6879 data: 0.0822 lr: 4.08e-05 mem: 47% pow: 613.839 W 0: INFO 26-04-29 18:39:39.046003 - 3:04:19 - step: 22610 acc: 0 loss: 1.2015 grad: 1.56e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6337 data: 0.0764 lr: 4.08e-05 mem: 54% pow: 639.957 W 0: INFO 26-04-29 18:39:52.526448 - 3:04:33 - step: 22620 acc: 0 loss: 1.7703 grad: 1.50e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6083 data: 0.0798 lr: 4.07e-05 mem: 47% pow: 661.716 W 0: INFO 26-04-29 18:40:06.231210 - 3:04:47 - step: 22630 acc: 0 loss: 1.4237 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5964 data: 0.089 lr: 4.07e-05 mem: 47% pow: 666.254 W 0: INFO 26-04-29 18:40:20.239319 - 3:05:01 - step: 22640 acc: 0 loss: 1.3728 grad: 1.50e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6168 data: 0.0887 lr: 4.07e-05 mem: 47% pow: 648.478 W 0: INFO 26-04-29 18:40:34.100443 - 3:05:14 - step: 22650 acc: 0 loss: 1.6115 grad: 1.53e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5859 data: 0.0927 lr: 4.07e-05 mem: 47% pow: 666.51 W 0: INFO 26-04-29 18:40:47.828041 - 3:05:28 - step: 22660 acc: 0 loss: 1.3203 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5861 data: 0.1035 lr: 4.07e-05 mem: 47% pow: 653.009 W 0: INFO 26-04-29 18:41:01.639425 - 3:05:42 - step: 22670 acc: 0 loss: 1.232 grad: 1.49e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6152 data: 0.0885 lr: 4.07e-05 mem: 47% pow: 646.45 W 0: INFO 26-04-29 18:41:15.379279 - 3:05:56 - step: 22680 acc: 0 loss: 1.5161 grad: 1.43e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5913 data: 0.089 lr: 4.07e-05 mem: 47% pow: 659.855 W 0: INFO 26-04-29 18:41:28.870482 - 3:06:09 - step: 22690 acc: 0 loss: 1.3883 grad: 1.50e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6007 data: 0.0964 lr: 4.06e-05 mem: 47% pow: 645.155 W 0: INFO 26-04-29 18:41:42.282962 - 3:06:23 - step: 22700 acc: 0 loss: 1.2948 grad: 1.45e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5799 data: 0.0897 lr: 4.06e-05 mem: 47% pow: 686.393 W 0: INFO 26-04-29 18:41:58.826095 - 3:06:39 - step: 22710 acc: 0 loss: 1.5948 grad: 1.46e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6363 data: 0.0766 lr: 4.06e-05 mem: 54% pow: 645.724 W 0: INFO 26-04-29 18:42:12.405294 - 3:06:53 - step: 22720 acc: 0 loss: 1.2935 grad: 1.52e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.598 data: 0.0901 lr: 4.06e-05 mem: 47% pow: 666.053 W 0: INFO 26-04-29 18:42:25.860528 - 3:07:06 - step: 22730 acc: 0 loss: 1.18 grad: 1.45e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6201 data: 0.0844 lr: 4.06e-05 mem: 47% pow: 665.898 W 0: INFO 26-04-29 18:42:39.241153 - 3:07:20 - step: 22740 acc: 0 loss: 1.035 grad: 1.43e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.586 data: 0.0845 lr: 4.06e-05 mem: 47% pow: 676.298 W 0: INFO 26-04-29 18:42:52.744761 - 3:07:33 - step: 22750 acc: 0 loss: 1.3422 grad: 1.50e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6126 data: 0.0588 lr: 4.05e-05 mem: 47% pow: 673.56 W 0: INFO 26-04-29 18:43:06.251238 - 3:07:47 - step: 22760 acc: 0 loss: 1.7826 grad: 1.48e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6014 data: 0.08 lr: 4.05e-05 mem: 47% pow: 663.594 W 0: INFO 26-04-29 18:43:19.696946 - 3:08:00 - step: 22770 acc: 0 loss: 1.2644 grad: 1.53e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6095 data: 0.0912 lr: 4.05e-05 mem: 47% pow: 661.53 W 0: INFO 26-04-29 18:43:33.158189 - 3:08:13 - step: 22780 acc: 0 loss: 1.686 grad: 1.49e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5809 data: 0.0885 lr: 4.05e-05 mem: 47% pow: 680.661 W 0: INFO 26-04-29 18:43:46.577769 - 3:08:27 - step: 22790 acc: 0 loss: 1.161 grad: 1.57e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.612 data: 0.0701 lr: 4.05e-05 mem: 47% pow: 664.482 W 0: INFO 26-04-29 18:44:00.162944 - 3:08:40 - step: 22800 acc: 0 loss: 1.5247 grad: 1.53e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5976 data: 0.0881 lr: 4.05e-05 mem: 47% pow: 677.391 W 0: INFO 26-04-29 18:44:16.535412 - 3:08:57 - step: 22810 acc: 0 loss: 1.1806 grad: 1.59e-01 flops: 3.45e+14 wps: 4.00e+04 iter: 0.5963 data: 0.0856 lr: 4.05e-05 mem: 54% pow: 659.289 W 0: INFO 26-04-29 18:44:30.199363 - 3:09:10 - step: 22820 acc: 0 loss: 1.3406 grad: 1.45e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.663 data: 0.0885 lr: 4.04e-05 mem: 47% pow: 623.282 W 0: INFO 26-04-29 18:44:43.717209 - 3:09:24 - step: 22830 acc: 0 loss: 1.1742 grad: 1.57e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5856 data: 0.0942 lr: 4.04e-05 mem: 47% pow: 657.376 W 0: INFO 26-04-29 18:44:57.446591 - 3:09:38 - step: 22840 acc: 0 loss: 1.2258 grad: 1.59e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7994 data: 0.0758 lr: 4.04e-05 mem: 47% pow: 554.432 W 0: INFO 26-04-29 18:45:10.939455 - 3:09:51 - step: 22850 acc: 0 loss: 1.5581 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5941 data: 0.0786 lr: 4.04e-05 mem: 47% pow: 666.977 W 0: INFO 26-04-29 18:45:24.449179 - 3:10:05 - step: 22860 acc: 0 loss: 1.3201 grad: 1.44e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5907 data: 0.0829 lr: 4.04e-05 mem: 47% pow: 669.701 W 0: INFO 26-04-29 18:45:37.925414 - 3:10:18 - step: 22870 acc: 0 loss: 1.0497 grad: 1.49e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6554 data: 0.063 lr: 4.04e-05 mem: 47% pow: 630.995 W 0: INFO 26-04-29 18:45:51.489205 - 3:10:32 - step: 22880 acc: 0 loss: 1.4234 grad: 1.53e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5923 data: 0.0841 lr: 4.04e-05 mem: 47% pow: 666.852 W 0: INFO 26-04-29 18:46:05.064260 - 3:10:45 - step: 22890 acc: 0 loss: 1.2338 grad: 1.49e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6022 data: 0.0817 lr: 4.03e-05 mem: 47% pow: 668.193 W 0: INFO 26-04-29 18:46:18.541853 - 3:10:59 - step: 22900 acc: 0 loss: 1.1518 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5869 data: 0.0853 lr: 4.03e-05 mem: 47% pow: 671.349 W 0: INFO 26-04-29 18:46:34.924723 - 3:11:15 - step: 22910 acc: 0 loss: 1.1614 grad: 1.42e-01 flops: 3.45e+14 wps: 4.00e+04 iter: 0.5918 data: 0.0989 lr: 4.03e-05 mem: 54% pow: 657.206 W 0: INFO 26-04-29 18:46:48.545264 - 3:11:29 - step: 22920 acc: 0 loss: 1.4173 grad: 1.60e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5958 data: 0.0815 lr: 4.03e-05 mem: 47% pow: 660.984 W 0: INFO 26-04-29 18:47:02.111929 - 3:11:42 - step: 22930 acc: 0 loss: 1.1287 grad: 1.50e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5918 data: 0.086 lr: 4.03e-05 mem: 47% pow: 662.025 W 0: INFO 26-04-29 18:47:15.728405 - 3:11:56 - step: 22940 acc: 0 loss: 1.2617 grad: 1.53e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5942 data: 0.0865 lr: 4.03e-05 mem: 47% pow: 661.449 W 0: INFO 26-04-29 18:47:29.192394 - 3:12:09 - step: 22950 acc: 0 loss: 1.2292 grad: 1.53e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5817 data: 0.0979 lr: 4.03e-05 mem: 47% pow: 662.797 W 0: INFO 26-04-29 18:47:43.028554 - 3:12:23 - step: 22960 acc: 0 loss: 1.2656 grad: 1.48e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6006 data: 0.0806 lr: 4.02e-05 mem: 47% pow: 659.26 W 0: INFO 26-04-29 18:47:56.541685 - 3:12:37 - step: 22970 acc: 0 loss: 1.1764 grad: 1.48e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6036 data: 0.0899 lr: 4.02e-05 mem: 47% pow: 657.574 W 0: INFO 26-04-29 18:48:10.303430 - 3:12:51 - step: 22980 acc: 0 loss: 1.3183 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5797 data: 0.0896 lr: 4.02e-05 mem: 47% pow: 681.21 W 0: INFO 26-04-29 18:48:23.856342 - 3:13:04 - step: 22990 acc: 0 loss: 1.2853 grad: 1.44e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6113 data: 0.0912 lr: 4.02e-05 mem: 47% pow: 650.08 W 0: INFO 26-04-29 18:48:37.657167 - 3:13:18 - step: 23000 acc: 0 loss: 1.1202 grad: 1.43e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6342 data: 0.0841 lr: 4.02e-05 mem: 47% pow: 634.112 W 0: INFO 26-04-29 18:48:41.331064 - 3:13:22 - garbage collection 0: INFO 26-04-29 18:48:55.874841 - 3:13:36 - step: 23010 acc: 0 loss: 1.3157 grad: 1.61e-01 flops: 3.10e+14 wps: 3.60e+04 iter: 0.6192 data: 0.0835 lr: 4.02e-05 mem: 54% pow: 644.923 W 0: INFO 26-04-29 18:49:09.810330 - 3:13:50 - step: 23020 acc: 0 loss: 1.4171 grad: 1.59e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.7206 data: 0.0761 lr: 4.01e-05 mem: 47% pow: 596.371 W 0: INFO 26-04-29 18:49:23.418257 - 3:14:04 - step: 23030 acc: 0 loss: 1.3696 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6575 data: 0.0884 lr: 4.01e-05 mem: 47% pow: 640.14 W 0: INFO 26-04-29 18:49:37.355437 - 3:14:18 - step: 23040 acc: 0 loss: 1.577 grad: 1.50e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5965 data: 0.0874 lr: 4.01e-05 mem: 47% pow: 667.921 W 0: INFO 26-04-29 18:49:51.230151 - 3:14:32 - step: 23050 acc: 0 loss: 1.2719 grad: 1.66e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6136 data: 0.0878 lr: 4.01e-05 mem: 47% pow: 639.674 W 0: INFO 26-04-29 18:50:04.943392 - 3:14:45 - step: 23060 acc: 0 loss: 1.4571 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6112 data: 0.0673 lr: 4.01e-05 mem: 47% pow: 671.065 W 0: INFO 26-04-29 18:50:18.769950 - 3:14:59 - step: 23070 acc: 0 loss: 1.2609 grad: 1.49e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5944 data: 0.0862 lr: 4.01e-05 mem: 47% pow: 661.952 W 0: INFO 26-04-29 18:50:32.350666 - 3:15:13 - step: 23080 acc: 0 loss: 1.4673 grad: 1.45e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5876 data: 0.0849 lr: 4.01e-05 mem: 47% pow: 675.569 W 0: INFO 26-04-29 18:50:45.884613 - 3:15:26 - step: 23090 acc: 0 loss: 1.1618 grad: 1.77e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6183 data: 0.0607 lr: 4.00e-05 mem: 47% pow: 661.807 W 0: INFO 26-04-29 18:50:59.695744 - 3:15:40 - step: 23100 acc: 0 loss: 1.3028 grad: 1.49e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.59 data: 0.0986 lr: 4.00e-05 mem: 47% pow: 663.103 W 0: INFO 26-04-29 18:51:16.549111 - 3:15:57 - step: 23110 acc: 0 loss: 1.3671 grad: 1.48e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.5981 data: 0.0817 lr: 4.00e-05 mem: 54% pow: 660.621 W 0: INFO 26-04-29 18:51:30.209283 - 3:16:11 - step: 23120 acc: 0 loss: 1.3518 grad: 1.51e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5844 data: 0.0917 lr: 4.00e-05 mem: 47% pow: 667.133 W 0: INFO 26-04-29 18:51:44.000916 - 3:16:24 - step: 23130 acc: 0 loss: 1.3353 grad: 1.51e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6326 data: 0.076 lr: 4.00e-05 mem: 47% pow: 650.719 W 0: INFO 26-04-29 18:51:57.802334 - 3:16:38 - step: 23140 acc: 0 loss: 1.3968 grad: 1.43e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6224 data: 0.0749 lr: 4.00e-05 mem: 47% pow: 646.889 W 0: INFO 26-04-29 18:52:11.545031 - 3:16:52 - step: 23150 acc: 0 loss: 1.357 grad: 1.61e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6884 data: 0.0897 lr: 4.00e-05 mem: 47% pow: 608.238 W 0: INFO 26-04-29 18:52:25.257973 - 3:17:06 - step: 23160 acc: 0 loss: 1.6348 grad: 1.42e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6644 data: 0.0843 lr: 3.99e-05 mem: 47% pow: 624.049 W 0: INFO 26-04-29 18:52:38.890198 - 3:17:19 - step: 23170 acc: 0 loss: 1.0814 grad: 1.45e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6629 data: 0.076 lr: 3.99e-05 mem: 47% pow: 630.999 W 0: INFO 26-04-29 18:52:52.564258 - 3:17:33 - step: 23180 acc: 0 loss: 1.5733 grad: 1.49e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.598 data: 0.091 lr: 3.99e-05 mem: 47% pow: 661.393 W 0: INFO 26-04-29 18:53:06.128451 - 3:17:46 - step: 23190 acc: 0 loss: 1.283 grad: 1.68e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5817 data: 0.1165 lr: 3.99e-05 mem: 47% pow: 645.484 W 0: INFO 26-04-29 18:53:20.065636 - 3:18:00 - step: 23200 acc: 0 loss: 1.3098 grad: 1.46e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6078 data: 0.0906 lr: 3.99e-05 mem: 47% pow: 648.632 W 0: INFO 26-04-29 18:53:36.725952 - 3:18:17 - step: 23210 acc: 0 loss: 1.3002 grad: 1.62e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5883 data: 0.0916 lr: 3.99e-05 mem: 54% pow: 663.685 W 0: INFO 26-04-29 18:53:50.561473 - 3:18:31 - step: 23220 acc: 0 loss: 1.271 grad: 1.62e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6638 data: 0.0933 lr: 3.99e-05 mem: 47% pow: 615.266 W 0: INFO 26-04-29 18:54:04.106788 - 3:18:44 - step: 23230 acc: 0 loss: 1.4402 grad: 1.49e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5959 data: 0.0862 lr: 3.98e-05 mem: 47% pow: 663.616 W 0: INFO 26-04-29 18:54:17.693968 - 3:18:58 - step: 23240 acc: 0 loss: 1.1394 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5927 data: 0.0902 lr: 3.98e-05 mem: 47% pow: 662.437 W 0: INFO 26-04-29 18:54:31.399228 - 3:19:12 - step: 23250 acc: 0 loss: 1.2116 grad: 1.60e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5792 data: 0.0896 lr: 3.98e-05 mem: 47% pow: 673.224 W 0: INFO 26-04-29 18:54:45.271002 - 3:19:26 - step: 23260 acc: 0 loss: 1.4457 grad: 1.52e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5806 data: 0.1777 lr: 3.98e-05 mem: 47% pow: 619.132 W 0: INFO 26-04-29 18:54:58.828083 - 3:19:39 - step: 23270 acc: 0 loss: 1.5052 grad: 1.54e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5925 data: 0.0893 lr: 3.98e-05 mem: 47% pow: 661.634 W 0: INFO 26-04-29 18:55:12.371072 - 3:19:53 - step: 23280 acc: 0 loss: 1.3928 grad: 1.46e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5958 data: 0.0874 lr: 3.98e-05 mem: 47% pow: 661.759 W 0: INFO 26-04-29 18:55:26.375116 - 3:20:07 - step: 23290 acc: 0 loss: 1.3986 grad: 1.51e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6308 data: 0.0709 lr: 3.97e-05 mem: 47% pow: 658.536 W 0: INFO 26-04-29 18:55:39.886521 - 3:20:20 - step: 23300 acc: 0 loss: 1.3503 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6187 data: 0.0812 lr: 3.97e-05 mem: 47% pow: 647.307 W 0: INFO 26-04-29 18:55:56.994003 - 3:20:37 - step: 23310 acc: 0 loss: 1.2274 grad: 1.51e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.5965 data: 0.0907 lr: 3.97e-05 mem: 54% pow: 650.632 W 0: INFO 26-04-29 18:56:10.565049 - 3:20:51 - step: 23320 acc: 0 loss: 1.462 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.671 data: 0.048 lr: 3.97e-05 mem: 47% pow: 644.484 W 0: INFO 26-04-29 18:56:24.493116 - 3:21:05 - step: 23330 acc: 0 loss: 1.2578 grad: 1.53e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6017 data: 0.0849 lr: 3.97e-05 mem: 47% pow: 665.925 W 0: INFO 26-04-29 18:56:38.153164 - 3:21:18 - step: 23340 acc: 0 loss: 1.2153 grad: 1.55e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6085 data: 0.0916 lr: 3.97e-05 mem: 47% pow: 646.117 W 0: INFO 26-04-29 18:56:51.878735 - 3:21:32 - step: 23350 acc: 0 loss: 1.3664 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7168 data: 0.0897 lr: 3.97e-05 mem: 47% pow: 594.08 W 0: INFO 26-04-29 18:57:05.457952 - 3:21:46 - step: 23360 acc: 0 loss: 1.5633 grad: 1.41e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6102 data: 0.0788 lr: 3.96e-05 mem: 47% pow: 672.137 W 0: INFO 26-04-29 18:57:19.276171 - 3:22:00 - step: 23370 acc: 0 loss: 1.3138 grad: 1.52e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5838 data: 0.1247 lr: 3.96e-05 mem: 47% pow: 645.139 W 0: INFO 26-04-29 18:57:33.097758 - 3:22:13 - step: 23380 acc: 0 loss: 1.7099 grad: 1.50e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5918 data: 0.0931 lr: 3.96e-05 mem: 47% pow: 673.455 W 0: INFO 26-04-29 18:57:46.739764 - 3:22:27 - step: 23390 acc: 0 loss: 1.319 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5841 data: 0.0917 lr: 3.96e-05 mem: 47% pow: 662.285 W 0: INFO 26-04-29 18:58:00.581998 - 3:22:41 - step: 23400 acc: 0 loss: 1.2071 grad: 1.55e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6398 data: 0.0518 lr: 3.96e-05 mem: 47% pow: 662.549 W 0: INFO 26-04-29 18:58:17.414308 - 3:22:58 - step: 23410 acc: 0 loss: 1.3757 grad: 1.46e-01 flops: 3.36e+14 wps: 3.89e+04 iter: 0.6239 data: 0.0854 lr: 3.96e-05 mem: 54% pow: 654.362 W 0: INFO 26-04-29 18:58:31.073275 - 3:23:11 - step: 23420 acc: 0 loss: 1.234 grad: 1.47e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5921 data: 0.0912 lr: 3.96e-05 mem: 47% pow: 665.368 W 0: INFO 26-04-29 18:58:44.647676 - 3:23:25 - step: 23430 acc: 0 loss: 1.4748 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5968 data: 0.0821 lr: 3.95e-05 mem: 47% pow: 657.027 W 0: INFO 26-04-29 18:58:58.202145 - 3:23:38 - step: 23440 acc: 0 loss: 1.3249 grad: 1.77e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6223 data: 0.0715 lr: 3.95e-05 mem: 47% pow: 662.752 W 0: INFO 26-04-29 18:59:11.757605 - 3:23:52 - step: 23450 acc: 0 loss: 1.5483 grad: 1.52e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5968 data: 0.0762 lr: 3.95e-05 mem: 47% pow: 660.055 W 0: INFO 26-04-29 18:59:25.246489 - 3:24:06 - step: 23460 acc: 0 loss: 1.9106 grad: 1.56e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5883 data: 0.0908 lr: 3.95e-05 mem: 47% pow: 661.688 W 0: INFO 26-04-29 18:59:38.725231 - 3:24:19 - step: 23470 acc: 0 loss: 1.028 grad: 1.45e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5938 data: 0.0811 lr: 3.95e-05 mem: 47% pow: 664.573 W 0: INFO 26-04-29 18:59:52.638942 - 3:24:33 - step: 23480 acc: 0 loss: 1.3705 grad: 1.47e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5908 data: 0.085 lr: 3.95e-05 mem: 47% pow: 671.405 W 0: INFO 26-04-29 19:00:06.098213 - 3:24:46 - step: 23490 acc: 0 loss: 1.2052 grad: 1.52e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5958 data: 0.0887 lr: 3.94e-05 mem: 47% pow: 661.172 W 0: INFO 26-04-29 19:00:19.732123 - 3:25:00 - step: 23500 acc: 0 loss: 1.341 grad: 1.62e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6374 data: 0.0689 lr: 3.94e-05 mem: 47% pow: 660.531 W 0: INFO 26-04-29 19:00:36.229976 - 3:25:17 - step: 23510 acc: 0 loss: 1.253 grad: 1.51e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.5823 data: 0.0969 lr: 3.94e-05 mem: 54% pow: 656.318 W 0: INFO 26-04-29 19:00:49.933863 - 3:25:30 - step: 23520 acc: 0 loss: 1.4459 grad: 1.51e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6176 data: 0.0886 lr: 3.94e-05 mem: 47% pow: 654.467 W 0: INFO 26-04-29 19:01:03.622060 - 3:25:44 - step: 23530 acc: 0 loss: 1.2533 grad: 1.61e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5938 data: 0.093 lr: 3.94e-05 mem: 47% pow: 665.839 W 0: INFO 26-04-29 19:01:17.469572 - 3:25:58 - step: 23540 acc: 0 loss: 1.539 grad: 1.41e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.588 data: 0.0924 lr: 3.94e-05 mem: 47% pow: 659.729 W 0: INFO 26-04-29 19:01:30.988326 - 3:26:11 - step: 23550 acc: 0 loss: 1.8337 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5934 data: 0.0823 lr: 3.94e-05 mem: 47% pow: 668.315 W 0: INFO 26-04-29 19:01:44.837392 - 3:26:25 - step: 23560 acc: 0 loss: 1.2647 grad: 1.59e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6298 data: 0.0766 lr: 3.93e-05 mem: 47% pow: 660.566 W 0: INFO 26-04-29 19:01:58.585438 - 3:26:39 - step: 23570 acc: 0 loss: 1.311 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7563 data: 0.0878 lr: 3.93e-05 mem: 47% pow: 577.203 W 0: INFO 26-04-29 19:02:12.284404 - 3:26:53 - step: 23580 acc: 0 loss: 1.5333 grad: 1.48e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6529 data: 0.0267 lr: 3.93e-05 mem: 47% pow: 659.848 W 0: INFO 26-04-29 19:02:25.935094 - 3:27:06 - step: 23590 acc: 0 loss: 1.6441 grad: 1.48e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5954 data: 0.0938 lr: 3.93e-05 mem: 47% pow: 655.852 W 0: INFO 26-04-29 19:02:39.761579 - 3:27:20 - step: 23600 acc: 0 loss: 1.4241 grad: 1.46e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5851 data: 0.0853 lr: 3.93e-05 mem: 47% pow: 672.443 W 0: INFO 26-04-29 19:02:56.573115 - 3:27:37 - step: 23610 acc: 0 loss: 1.6654 grad: 1.45e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6432 data: 0.0646 lr: 3.93e-05 mem: 54% pow: 659.146 W 0: INFO 26-04-29 19:03:10.205993 - 3:27:51 - step: 23620 acc: 0 loss: 1.2001 grad: 1.50e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5824 data: 0.0884 lr: 3.93e-05 mem: 47% pow: 674.19 W 0: INFO 26-04-29 19:03:23.772157 - 3:28:04 - step: 23630 acc: 0 loss: 1.696 grad: 1.45e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.626 data: 0.0837 lr: 3.92e-05 mem: 47% pow: 662.753 W 0: INFO 26-04-29 19:03:37.272652 - 3:28:18 - step: 23640 acc: 0 loss: 1.3708 grad: 1.44e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6016 data: 0.0832 lr: 3.92e-05 mem: 47% pow: 666.187 W 0: INFO 26-04-29 19:03:50.927863 - 3:28:31 - step: 23650 acc: 0 loss: 1.6069 grad: 1.53e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6178 data: 0.0981 lr: 3.92e-05 mem: 47% pow: 632.87 W 0: INFO 26-04-29 19:04:04.502678 - 3:28:45 - step: 23660 acc: 0 loss: 1.5917 grad: 1.65e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6109 data: 0.0877 lr: 3.92e-05 mem: 47% pow: 645.996 W 0: INFO 26-04-29 19:04:18.138452 - 3:28:58 - step: 23670 acc: 0 loss: 1.3678 grad: 1.55e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5929 data: 0.0936 lr: 3.92e-05 mem: 47% pow: 656.584 W 0: INFO 26-04-29 19:04:31.729869 - 3:29:12 - step: 23680 acc: 0 loss: 1.2958 grad: 1.46e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6529 data: 0.0885 lr: 3.92e-05 mem: 47% pow: 622.894 W 0: INFO 26-04-29 19:04:45.223553 - 3:29:26 - step: 23690 acc: 0 loss: 1.4135 grad: 1.77e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6093 data: 0.0702 lr: 3.92e-05 mem: 47% pow: 657.325 W 0: INFO 26-04-29 19:04:58.847981 - 3:29:39 - step: 23700 acc: 0 loss: 1.3681 grad: 1.49e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5861 data: 0.0918 lr: 3.91e-05 mem: 47% pow: 667.012 W 0: INFO 26-04-29 19:05:15.517322 - 3:29:56 - step: 23710 acc: 0 loss: 1.4258 grad: 1.40e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6201 data: 0.0859 lr: 3.91e-05 mem: 54% pow: 668.302 W 0: INFO 26-04-29 19:05:29.358041 - 3:30:10 - step: 23720 acc: 0 loss: 1.3552 grad: 1.46e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6178 data: 0.0919 lr: 3.91e-05 mem: 47% pow: 650.267 W 0: INFO 26-04-29 19:05:43.018014 - 3:30:23 - step: 23730 acc: 0 loss: 1.3328 grad: 1.44e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6402 data: 0.0906 lr: 3.91e-05 mem: 47% pow: 640.094 W 0: INFO 26-04-29 19:05:56.639531 - 3:30:37 - step: 23740 acc: 0 loss: 1.2934 grad: 1.44e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6208 data: 0.0855 lr: 3.91e-05 mem: 47% pow: 649.072 W 0: INFO 26-04-29 19:06:10.163711 - 3:30:50 - step: 23750 acc: 0 loss: 1.2717 grad: 1.49e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5912 data: 0.0862 lr: 3.91e-05 mem: 47% pow: 661.647 W 0: INFO 26-04-29 19:06:23.755923 - 3:31:04 - step: 23760 acc: 0 loss: 1.5207 grad: 1.40e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5818 data: 0.0887 lr: 3.90e-05 mem: 47% pow: 668.614 W 0: INFO 26-04-29 19:06:37.253668 - 3:31:18 - step: 23770 acc: 0 loss: 1.2645 grad: 1.49e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5987 data: 0.0895 lr: 3.90e-05 mem: 47% pow: 663.472 W 0: INFO 26-04-29 19:06:50.777738 - 3:31:31 - step: 23780 acc: 0 loss: 1.2335 grad: 1.52e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5807 data: 0.0919 lr: 3.90e-05 mem: 47% pow: 679.118 W 0: INFO 26-04-29 19:07:04.349760 - 3:31:45 - step: 23790 acc: 0 loss: 1.4478 grad: 1.52e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6446 data: 0.0775 lr: 3.90e-05 mem: 47% pow: 639.05 W 0: INFO 26-04-29 19:07:17.944611 - 3:31:58 - step: 23800 acc: 0 loss: 1.4769 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5939 data: 0.0887 lr: 3.90e-05 mem: 47% pow: 663.867 W 0: INFO 26-04-29 19:07:34.724752 - 3:32:15 - step: 23810 acc: 0 loss: 1.6515 grad: 1.46e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6064 data: 0.082 lr: 3.90e-05 mem: 54% pow: 665.984 W 0: INFO 26-04-29 19:07:48.224901 - 3:32:29 - step: 23820 acc: 0 loss: 1.0738 grad: 1.46e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.623 data: 0.0887 lr: 3.90e-05 mem: 47% pow: 639.482 W 0: INFO 26-04-29 19:08:01.847210 - 3:32:42 - step: 23830 acc: 0 loss: 1.5125 grad: 1.43e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6131 data: 0.0843 lr: 3.89e-05 mem: 47% pow: 652.907 W 0: INFO 26-04-29 19:08:15.685992 - 3:32:56 - step: 23840 acc: 0 loss: 1.5322 grad: 1.54e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7238 data: 0.0947 lr: 3.89e-05 mem: 47% pow: 582.86 W 0: INFO 26-04-29 19:08:29.096009 - 3:33:09 - step: 23850 acc: 0 loss: 1.4674 grad: 1.47e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.597 data: 0.0703 lr: 3.89e-05 mem: 47% pow: 681.295 W 0: INFO 26-04-29 19:08:42.946020 - 3:33:23 - step: 23860 acc: 0 loss: 1.5076 grad: 1.56e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6355 data: 0.0867 lr: 3.89e-05 mem: 47% pow: 590.248 W 0: INFO 26-04-29 19:08:56.513058 - 3:33:37 - step: 23870 acc: 0 loss: 1.2192 grad: 1.41e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5896 data: 0.082 lr: 3.89e-05 mem: 47% pow: 683.397 W 0: INFO 26-04-29 19:09:09.974413 - 3:33:50 - step: 23880 acc: 0 loss: 1.4292 grad: 1.46e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6449 data: 0.0967 lr: 3.89e-05 mem: 47% pow: 624.877 W 0: INFO 26-04-29 19:09:23.394359 - 3:34:04 - step: 23890 acc: 0 loss: 1.4596 grad: 1.47e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5894 data: 0.0936 lr: 3.89e-05 mem: 47% pow: 660.743 W 0: INFO 26-04-29 19:09:37.025289 - 3:34:17 - step: 23900 acc: 0 loss: 1.63 grad: 1.39e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.58 data: 0.0989 lr: 3.88e-05 mem: 47% pow: 666.828 W 0: INFO 26-04-29 19:09:53.716145 - 3:34:34 - step: 23910 acc: 0 loss: 1.3891 grad: 1.45e-01 flops: 3.38e+14 wps: 3.93e+04 iter: 0.6101 data: 0.0761 lr: 3.88e-05 mem: 54% pow: 665.908 W 0: INFO 26-04-29 19:10:07.412716 - 3:34:48 - step: 23920 acc: 0 loss: 1.3462 grad: 1.49e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5874 data: 0.09 lr: 3.88e-05 mem: 47% pow: 661.712 W 0: INFO 26-04-29 19:10:21.129585 - 3:35:01 - step: 23930 acc: 0 loss: 1.3813 grad: 1.47e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6028 data: 0.088 lr: 3.88e-05 mem: 47% pow: 660.558 W 0: INFO 26-04-29 19:10:34.612697 - 3:35:15 - step: 23940 acc: 0 loss: 1.4069 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5919 data: 0.0887 lr: 3.88e-05 mem: 47% pow: 668.683 W 0: INFO 26-04-29 19:10:48.088718 - 3:35:28 - step: 23950 acc: 0 loss: 1.2679 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5928 data: 0.0876 lr: 3.88e-05 mem: 47% pow: 663.199 W 0: INFO 26-04-29 19:11:01.537638 - 3:35:42 - step: 23960 acc: 0 loss: 1.4747 grad: 1.46e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5821 data: 0.0868 lr: 3.87e-05 mem: 47% pow: 677.895 W 0: INFO 26-04-29 19:11:15.185309 - 3:35:55 - step: 23970 acc: 0 loss: 1.4239 grad: 1.62e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5852 data: 0.0893 lr: 3.87e-05 mem: 47% pow: 663.616 W 0: INFO 26-04-29 19:11:28.806534 - 3:36:09 - step: 23980 acc: 0 loss: 1.2609 grad: 1.54e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5801 data: 0.1086 lr: 3.87e-05 mem: 47% pow: 657.829 W 0: INFO 26-04-29 19:11:42.653361 - 3:36:23 - step: 23990 acc: 0 loss: 1.1519 grad: 1.45e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6067 data: 0.0764 lr: 3.87e-05 mem: 47% pow: 670.757 W 0: INFO 26-04-29 19:11:56.454743 - 3:36:37 - step: 24000 acc: 0 loss: 1.3269 grad: 1.53e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5965 data: 0.0822 lr: 3.87e-05 mem: 47% pow: 660.153 W 0: INFO 26-04-29 19:12:00.233446 - 3:36:41 - garbage collection 0: INFO 26-04-29 19:12:14.618730 - 3:36:55 - step: 24010 acc: 0 loss: 1.4457 grad: 1.38e-01 flops: 3.11e+14 wps: 3.61e+04 iter: 0.6262 data: 0.078 lr: 3.87e-05 mem: 54% pow: 649.443 W 0: INFO 26-04-29 19:12:28.367355 - 3:37:09 - step: 24020 acc: 0 loss: 1.401 grad: 1.44e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5926 data: 0.088 lr: 3.87e-05 mem: 47% pow: 682.544 W 0: INFO 26-04-29 19:12:41.807217 - 3:37:22 - step: 24030 acc: 0 loss: 1.3476 grad: 1.51e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.581 data: 0.089 lr: 3.86e-05 mem: 47% pow: 662.978 W 0: INFO 26-04-29 19:12:55.495793 - 3:37:36 - step: 24040 acc: 0 loss: 1.9824 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5952 data: 0.0911 lr: 3.86e-05 mem: 47% pow: 668.911 W 0: INFO 26-04-29 19:13:09.029229 - 3:37:49 - step: 24050 acc: 0 loss: 1.3839 grad: 1.57e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6287 data: 0.0881 lr: 3.86e-05 mem: 47% pow: 641.63 W 0: INFO 26-04-29 19:13:22.656733 - 3:38:03 - step: 24060 acc: 0 loss: 1.0581 grad: 1.53e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6107 data: 0.0899 lr: 3.86e-05 mem: 47% pow: 642.369 W 0: INFO 26-04-29 19:13:36.556316 - 3:38:17 - step: 24070 acc: 0 loss: 1.194 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6064 data: 0.089 lr: 3.86e-05 mem: 47% pow: 653.72 W 0: INFO 26-04-29 19:13:50.188269 - 3:38:30 - step: 24080 acc: 0 loss: 1.6653 grad: 1.54e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5857 data: 0.0915 lr: 3.86e-05 mem: 47% pow: 661.954 W 0: INFO 26-04-29 19:14:03.771599 - 3:38:44 - step: 24090 acc: 0 loss: 1.2523 grad: 1.54e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6268 data: 0.0842 lr: 3.86e-05 mem: 47% pow: 650.753 W 0: INFO 26-04-29 19:14:17.254417 - 3:38:58 - step: 24100 acc: 0 loss: 1.4494 grad: 1.56e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5822 data: 0.0935 lr: 3.85e-05 mem: 47% pow: 667.614 W 0: INFO 26-04-29 19:14:33.904375 - 3:39:14 - step: 24110 acc: 0 loss: 1.3531 grad: 1.45e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.5782 data: 0.1053 lr: 3.85e-05 mem: 54% pow: 664.877 W 0: INFO 26-04-29 19:14:47.496042 - 3:39:28 - step: 24120 acc: 0 loss: 1.3329 grad: 1.43e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6064 data: 0.0924 lr: 3.85e-05 mem: 47% pow: 648.412 W 0: INFO 26-04-29 19:15:01.075038 - 3:39:41 - step: 24130 acc: 0 loss: 1.377 grad: 1.44e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.619 data: 0.0835 lr: 3.85e-05 mem: 47% pow: 650.518 W 0: INFO 26-04-29 19:15:14.704035 - 3:39:55 - step: 24140 acc: 0 loss: 1.7048 grad: 1.55e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5973 data: 0.0884 lr: 3.85e-05 mem: 47% pow: 665.267 W 0: INFO 26-04-29 19:15:28.218398 - 3:40:09 - step: 24150 acc: 0 loss: 1.6108 grad: 1.45e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.595 data: 0.0851 lr: 3.85e-05 mem: 47% pow: 654.869 W 0: INFO 26-04-29 19:15:41.711647 - 3:40:22 - step: 24160 acc: 0 loss: 1.2295 grad: 1.55e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6689 data: 0.088 lr: 3.85e-05 mem: 47% pow: 610.691 W 0: INFO 26-04-29 19:15:55.281977 - 3:40:36 - step: 24170 acc: 0 loss: 1.2409 grad: 1.46e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6299 data: 0.0781 lr: 3.84e-05 mem: 47% pow: 646.409 W 0: INFO 26-04-29 19:16:08.663259 - 3:40:49 - step: 24180 acc: 0 loss: 1.3716 grad: 1.46e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5827 data: 0.0988 lr: 3.84e-05 mem: 47% pow: 664.651 W 0: INFO 26-04-29 19:16:22.141408 - 3:41:02 - step: 24190 acc: 0 loss: 1.2459 grad: 1.45e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.597 data: 0.0884 lr: 3.84e-05 mem: 47% pow: 671.98 W 0: INFO 26-04-29 19:16:35.800129 - 3:41:16 - step: 24200 acc: 0 loss: 1.3673 grad: 1.52e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6109 data: 0.0851 lr: 3.84e-05 mem: 47% pow: 651.253 W 0: INFO 26-04-29 19:16:52.545834 - 3:41:33 - step: 24210 acc: 0 loss: 1.3926 grad: 1.44e-01 flops: 3.37e+14 wps: 3.92e+04 iter: 0.589 data: 0.0918 lr: 3.84e-05 mem: 54% pow: 654.012 W 0: INFO 26-04-29 19:17:06.359079 - 3:41:47 - step: 24220 acc: 0 loss: 1.4568 grad: 1.51e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6622 data: 0.083 lr: 3.84e-05 mem: 47% pow: 630.322 W 0: INFO 26-04-29 19:17:19.982043 - 3:42:00 - step: 24230 acc: 0 loss: 1.5398 grad: 1.51e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5775 data: 0.1285 lr: 3.83e-05 mem: 47% pow: 642.27 W 0: INFO 26-04-29 19:17:33.640698 - 3:42:14 - step: 24240 acc: 0 loss: 1.3738 grad: 1.46e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6469 data: 0.0207 lr: 3.83e-05 mem: 47% pow: 679.353 W 0: INFO 26-04-29 19:17:47.069397 - 3:42:27 - step: 24250 acc: 0 loss: 1.5168 grad: 1.45e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6396 data: 0.089 lr: 3.83e-05 mem: 47% pow: 644.106 W 0: INFO 26-04-29 19:18:00.682524 - 3:42:41 - step: 24260 acc: 0 loss: 1.2577 grad: 1.61e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5881 data: 0.0986 lr: 3.83e-05 mem: 47% pow: 665.595 W 0: INFO 26-04-29 19:18:14.361169 - 3:42:55 - step: 24270 acc: 0 loss: 1.2929 grad: 1.48e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6251 data: 0.0758 lr: 3.83e-05 mem: 47% pow: 642.653 W 0: INFO 26-04-29 19:18:27.961119 - 3:43:08 - step: 24280 acc: 0 loss: 1.3818 grad: 1.45e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6297 data: 0.088 lr: 3.83e-05 mem: 47% pow: 629.709 W 0: INFO 26-04-29 19:18:41.410289 - 3:43:22 - step: 24290 acc: 0 loss: 1.3263 grad: 1.52e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5776 data: 0.1055 lr: 3.83e-05 mem: 47% pow: 666.266 W 0: INFO 26-04-29 19:18:54.962788 - 3:43:35 - step: 24300 acc: 0 loss: 1.2001 grad: 1.46e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6131 data: 0.0829 lr: 3.82e-05 mem: 47% pow: 651.76 W 0: INFO 26-04-29 19:19:11.272722 - 3:43:52 - step: 24310 acc: 0 loss: 1.4196 grad: 1.63e-01 flops: 3.46e+14 wps: 4.02e+04 iter: 0.5832 data: 0.0949 lr: 3.82e-05 mem: 54% pow: 660.54 W 0: INFO 26-04-29 19:19:24.728019 - 3:44:05 - step: 24320 acc: 0 loss: 1.601 grad: 1.63e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6053 data: 0.085 lr: 3.82e-05 mem: 47% pow: 652.475 W 0: INFO 26-04-29 19:19:38.273633 - 3:44:19 - step: 24330 acc: 0 loss: 1.4435 grad: 1.45e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.603 data: 0.0839 lr: 3.82e-05 mem: 47% pow: 666.013 W 0: INFO 26-04-29 19:19:51.815061 - 3:44:32 - step: 24340 acc: 0 loss: 1.4815 grad: 1.42e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5987 data: 0.082 lr: 3.82e-05 mem: 47% pow: 661.36 W 0: INFO 26-04-29 19:20:05.308005 - 3:44:46 - step: 24350 acc: 0 loss: 1.7399 grad: 1.54e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.592 data: 0.1003 lr: 3.82e-05 mem: 47% pow: 657.127 W 0: INFO 26-04-29 19:20:18.684701 - 3:44:59 - step: 24360 acc: 0 loss: 1.3812 grad: 1.49e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5791 data: 0.1085 lr: 3.82e-05 mem: 47% pow: 665.825 W 0: INFO 26-04-29 19:20:32.152744 - 3:45:12 - step: 24370 acc: 0 loss: 1.3739 grad: 1.48e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5812 data: 0.1019 lr: 3.81e-05 mem: 47% pow: 663.962 W 0: INFO 26-04-29 19:20:45.625941 - 3:45:26 - step: 24380 acc: 0 loss: 1.5998 grad: 1.47e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6189 data: 0.0878 lr: 3.81e-05 mem: 47% pow: 647.263 W 0: INFO 26-04-29 19:20:59.178288 - 3:45:39 - step: 24390 acc: 0 loss: 1.3037 grad: 1.42e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6118 data: 0.1056 lr: 3.81e-05 mem: 47% pow: 638.929 W 0: INFO 26-04-29 19:21:12.682826 - 3:45:53 - step: 24400 acc: 0 loss: 1.0897 grad: 1.49e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5905 data: 0.0962 lr: 3.81e-05 mem: 47% pow: 665.045 W 0: INFO 26-04-29 19:21:29.390923 - 3:46:10 - step: 24410 acc: 0 loss: 1.3632 grad: 1.47e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.598 data: 0.0897 lr: 3.81e-05 mem: 54% pow: 665.77 W 0: INFO 26-04-29 19:21:42.897720 - 3:46:23 - step: 24420 acc: 0 loss: 1.6462 grad: 1.57e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.585 data: 0.0906 lr: 3.81e-05 mem: 47% pow: 671.031 W 0: INFO 26-04-29 19:21:56.470348 - 3:46:37 - step: 24430 acc: 0 loss: 1.0354 grad: 1.55e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6104 data: 0.0792 lr: 3.80e-05 mem: 47% pow: 661.137 W 0: INFO 26-04-29 19:22:10.254436 - 3:46:51 - step: 24440 acc: 0 loss: 1.355 grad: 1.44e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.627 data: 0.0648 lr: 3.80e-05 mem: 47% pow: 656.396 W 0: INFO 26-04-29 19:22:23.773557 - 3:47:04 - step: 24450 acc: 0 loss: 1.3475 grad: 1.46e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6163 data: 0.077 lr: 3.80e-05 mem: 47% pow: 655.086 W 0: INFO 26-04-29 19:22:37.325432 - 3:47:18 - step: 24460 acc: 0 loss: 1.2777 grad: 1.47e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5994 data: 0.0786 lr: 3.80e-05 mem: 47% pow: 663.144 W 0: INFO 26-04-29 19:22:51.042104 - 3:47:31 - step: 24470 acc: 0 loss: 1.4088 grad: 1.47e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6568 data: 0.081 lr: 3.80e-05 mem: 47% pow: 627.563 W 0: INFO 26-04-29 19:23:04.749129 - 3:47:45 - step: 24480 acc: 0 loss: 1.0634 grad: 1.47e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5813 data: 0.0894 lr: 3.80e-05 mem: 47% pow: 677.365 W 0: INFO 26-04-29 19:23:18.339227 - 3:47:59 - step: 24490 acc: 0 loss: 1.1582 grad: 1.49e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6111 data: 0.0687 lr: 3.80e-05 mem: 47% pow: 661.339 W 0: INFO 26-04-29 19:23:31.924006 - 3:48:12 - step: 24500 acc: 0 loss: 1.4016 grad: 1.58e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6051 data: 0.0819 lr: 3.79e-05 mem: 47% pow: 663.324 W 0: INFO 26-04-29 19:23:48.252745 - 3:48:29 - step: 24510 acc: 0 loss: 1.1396 grad: 1.41e-01 flops: 3.46e+14 wps: 4.01e+04 iter: 0.59 data: 0.0843 lr: 3.79e-05 mem: 54% pow: 665.659 W 0: INFO 26-04-29 19:24:01.878473 - 3:48:42 - step: 24520 acc: 0 loss: 1.4743 grad: 1.45e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6462 data: 0.0911 lr: 3.79e-05 mem: 47% pow: 636.079 W 0: INFO 26-04-29 19:24:15.849118 - 3:48:56 - step: 24530 acc: 0 loss: 1.2929 grad: 1.49e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6003 data: 0.0852 lr: 3.79e-05 mem: 47% pow: 659.556 W 0: INFO 26-04-29 19:24:29.324401 - 3:49:10 - step: 24540 acc: 0 loss: 1.4285 grad: 1.45e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5937 data: 0.0873 lr: 3.79e-05 mem: 47% pow: 672.763 W 0: INFO 26-04-29 19:24:42.904588 - 3:49:23 - step: 24550 acc: 0 loss: 1.6088 grad: 1.49e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6737 data: 0.0861 lr: 3.79e-05 mem: 47% pow: 612.225 W 0: INFO 26-04-29 19:24:56.392213 - 3:49:37 - step: 24560 acc: 0 loss: 1.4613 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6075 data: 0.0732 lr: 3.79e-05 mem: 47% pow: 666.183 W 0: INFO 26-04-29 19:25:10.162409 - 3:49:50 - step: 24570 acc: 0 loss: 1.4071 grad: 1.57e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6096 data: 0.0865 lr: 3.78e-05 mem: 47% pow: 648.741 W 0: INFO 26-04-29 19:25:23.914311 - 3:50:04 - step: 24580 acc: 0 loss: 1.4318 grad: 1.58e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6256 data: 0.0703 lr: 3.78e-05 mem: 47% pow: 655.304 W 0: INFO 26-04-29 19:25:37.390653 - 3:50:18 - step: 24590 acc: 0 loss: 1.3949 grad: 1.55e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6143 data: 0.079 lr: 3.78e-05 mem: 47% pow: 659.912 W 0: INFO 26-04-29 19:25:50.969368 - 3:50:31 - step: 24600 acc: 0 loss: 1.0264 grad: 1.49e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6164 data: 0.0879 lr: 3.78e-05 mem: 47% pow: 646.393 W 0: INFO 26-04-29 19:26:07.637678 - 3:50:48 - step: 24610 acc: 0 loss: 1.4833 grad: 1.53e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5956 data: 0.0848 lr: 3.78e-05 mem: 54% pow: 658.025 W 0: INFO 26-04-29 19:26:21.443517 - 3:51:02 - step: 24620 acc: 0 loss: 1.5813 grad: 1.46e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6106 data: 0.0876 lr: 3.78e-05 mem: 47% pow: 654.383 W 0: INFO 26-04-29 19:26:35.078460 - 3:51:15 - step: 24630 acc: 0 loss: 1.2826 grad: 1.46e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6135 data: 0.085 lr: 3.78e-05 mem: 47% pow: 644.55 W 0: INFO 26-04-29 19:26:48.807657 - 3:51:29 - step: 24640 acc: 0 loss: 1.3933 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6178 data: 0.0667 lr: 3.77e-05 mem: 47% pow: 669.346 W 0: INFO 26-04-29 19:27:02.556415 - 3:51:43 - step: 24650 acc: 0 loss: 1.7707 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6587 data: 0.085 lr: 3.77e-05 mem: 47% pow: 625.218 W 0: INFO 26-04-29 19:27:16.113776 - 3:51:56 - step: 24660 acc: 0 loss: 1.0392 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5812 data: 0.1294 lr: 3.77e-05 mem: 47% pow: 644.396 W 0: INFO 26-04-29 19:27:29.793896 - 3:52:10 - step: 24670 acc: 0 loss: 1.3053 grad: 1.55e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5959 data: 0.0944 lr: 3.77e-05 mem: 47% pow: 658.25 W 0: INFO 26-04-29 19:27:43.489153 - 3:52:24 - step: 24680 acc: 0 loss: 1.4775 grad: 1.51e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6123 data: 0.0752 lr: 3.77e-05 mem: 47% pow: 654.662 W 0: INFO 26-04-29 19:27:56.939407 - 3:52:37 - step: 24690 acc: 0 loss: 1.7579 grad: 1.47e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5984 data: 0.0806 lr: 3.77e-05 mem: 47% pow: 670.637 W 0: INFO 26-04-29 19:28:10.631709 - 3:52:51 - step: 24700 acc: 0 loss: 1.3884 grad: 1.47e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5802 data: 0.091 lr: 3.76e-05 mem: 47% pow: 669.03 W 0: INFO 26-04-29 19:28:27.467091 - 3:53:08 - step: 24710 acc: 0 loss: 1.6423 grad: 1.50e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.5999 data: 0.0874 lr: 3.76e-05 mem: 54% pow: 666.425 W 0: INFO 26-04-29 19:28:41.019415 - 3:53:21 - step: 24720 acc: 0 loss: 1.5 grad: 1.40e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6014 data: 0.0723 lr: 3.76e-05 mem: 47% pow: 669.266 W 0: INFO 26-04-29 19:28:54.551285 - 3:53:35 - step: 24730 acc: 0 loss: 1.3893 grad: 1.70e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5971 data: 0.0872 lr: 3.76e-05 mem: 47% pow: 660.955 W 0: INFO 26-04-29 19:29:08.142545 - 3:53:48 - step: 24740 acc: 0 loss: 1.3878 grad: 1.48e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6063 data: 0.0867 lr: 3.76e-05 mem: 47% pow: 652.396 W 0: INFO 26-04-29 19:29:21.751586 - 3:54:02 - step: 24750 acc: 0 loss: 1.2901 grad: 1.47e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6129 data: 0.0811 lr: 3.76e-05 mem: 47% pow: 676.904 W 0: INFO 26-04-29 19:29:35.249707 - 3:54:16 - step: 24760 acc: 0 loss: 1.4549 grad: 1.49e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6084 data: 0.0811 lr: 3.76e-05 mem: 47% pow: 659.501 W 0: INFO 26-04-29 19:29:48.982442 - 3:54:29 - step: 24770 acc: 0 loss: 1.0775 grad: 1.42e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7187 data: 0.1223 lr: 3.75e-05 mem: 47% pow: 576.969 W 0: INFO 26-04-29 19:30:02.537866 - 3:54:43 - step: 24780 acc: 0 loss: 1.4177 grad: 1.48e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5974 data: 0.0949 lr: 3.75e-05 mem: 47% pow: 656.996 W 0: INFO 26-04-29 19:30:16.265260 - 3:54:57 - step: 24790 acc: 0 loss: 1.39 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6105 data: 0.0887 lr: 3.75e-05 mem: 47% pow: 643.168 W 0: INFO 26-04-29 19:30:30.160942 - 3:55:10 - step: 24800 acc: 0 loss: 1.4861 grad: 1.48e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.5874 data: 0.0926 lr: 3.75e-05 mem: 47% pow: 658.573 W 0: INFO 26-04-29 19:30:46.716440 - 3:55:27 - step: 24810 acc: 0 loss: 1.5271 grad: 1.42e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6242 data: 0.0837 lr: 3.75e-05 mem: 54% pow: 649.152 W 0: INFO 26-04-29 19:31:00.283198 - 3:55:41 - step: 24820 acc: 0 loss: 1.7518 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5891 data: 0.0871 lr: 3.75e-05 mem: 47% pow: 658.001 W 0: INFO 26-04-29 19:31:14.053461 - 3:55:54 - step: 24830 acc: 0 loss: 1.3042 grad: 1.45e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5987 data: 0.0816 lr: 3.75e-05 mem: 47% pow: 664.936 W 0: INFO 26-04-29 19:31:27.661320 - 3:56:08 - step: 24840 acc: 0 loss: 1.6886 grad: 1.47e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6246 data: 0.0938 lr: 3.74e-05 mem: 47% pow: 633.957 W 0: INFO 26-04-29 19:31:41.404858 - 3:56:22 - step: 24850 acc: 0 loss: 1.434 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5974 data: 0.0868 lr: 3.74e-05 mem: 47% pow: 661.212 W 0: INFO 26-04-29 19:31:54.947802 - 3:56:35 - step: 24860 acc: 0 loss: 1.5369 grad: 1.46e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.607 data: 0.0941 lr: 3.74e-05 mem: 47% pow: 654.561 W 0: INFO 26-04-29 19:32:08.657273 - 3:56:49 - step: 24870 acc: 0 loss: 1.2088 grad: 1.37e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6141 data: 0.0552 lr: 3.74e-05 mem: 47% pow: 677.375 W 0: INFO 26-04-29 19:32:22.279337 - 3:57:03 - step: 24880 acc: 0 loss: 1.374 grad: 1.54e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6446 data: 0.0929 lr: 3.74e-05 mem: 47% pow: 634.17 W 0: INFO 26-04-29 19:32:35.910074 - 3:57:16 - step: 24890 acc: 0 loss: 1.504 grad: 1.50e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6302 data: 0.0967 lr: 3.74e-05 mem: 47% pow: 632.679 W 0: INFO 26-04-29 19:32:49.651229 - 3:57:30 - step: 24900 acc: 0 loss: 1.452 grad: 1.40e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.8144 data: 0.0919 lr: 3.74e-05 mem: 47% pow: 537.326 W 0: INFO 26-04-29 19:33:06.079307 - 3:57:46 - step: 24910 acc: 0 loss: 1.1502 grad: 1.46e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.6198 data: 0.0719 lr: 3.73e-05 mem: 54% pow: 664.057 W 0: INFO 26-04-29 19:33:20.141914 - 3:58:00 - step: 24920 acc: 0 loss: 1.2791 grad: 1.45e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.5956 data: 0.078 lr: 3.73e-05 mem: 47% pow: 665.166 W 0: INFO 26-04-29 19:33:34.079436 - 3:58:14 - step: 24930 acc: 0 loss: 1.3478 grad: 1.55e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.609 data: 0.0814 lr: 3.73e-05 mem: 47% pow: 661.835 W 0: INFO 26-04-29 19:33:47.990354 - 3:58:28 - step: 24940 acc: 0 loss: 1.3983 grad: 1.53e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5816 data: 0.1473 lr: 3.73e-05 mem: 47% pow: 636.97 W 0: INFO 26-04-29 19:34:01.672634 - 3:58:42 - step: 24950 acc: 0 loss: 1.4914 grad: 1.40e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6011 data: 0.0826 lr: 3.73e-05 mem: 47% pow: 658.857 W 0: INFO 26-04-29 19:34:15.312625 - 3:58:56 - step: 24960 acc: 0 loss: 0.9195 grad: 1.46e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5975 data: 0.1091 lr: 3.73e-05 mem: 47% pow: 656.145 W 0: INFO 26-04-29 19:34:28.958580 - 3:59:09 - step: 24970 acc: 0 loss: 1.3281 grad: 1.43e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6078 data: 0.0864 lr: 3.72e-05 mem: 47% pow: 659.547 W 0: INFO 26-04-29 19:34:42.901681 - 3:59:23 - step: 24980 acc: 0 loss: 1.4639 grad: 1.47e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.651 data: 0.0886 lr: 3.72e-05 mem: 47% pow: 626.842 W 0: INFO 26-04-29 19:34:56.752659 - 3:59:37 - step: 24990 acc: 0 loss: 1.3051 grad: 1.44e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6044 data: 0.0841 lr: 3.72e-05 mem: 47% pow: 661.265 W 0: INFO 26-04-29 19:35:10.455645 - 3:59:51 - step: 25000 acc: 0 loss: 1.6805 grad: 1.49e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6191 data: 0.0848 lr: 3.72e-05 mem: 47% pow: 657.184 W 0: INFO 26-04-29 19:35:10.458232 - 3:59:51 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000025000 0: INFO 26-04-29 19:35:10.458802 - 3:59:51 - Saving... 0: INFO 26-04-29 19:35:16.170306 - 3:59:56 - State dict saved! 0: INFO 26-04-29 19:35:16.289761 - 3:59:57 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000025000/train_state_00000.json 0: INFO 26-04-29 19:35:16.293926 - 3:59:57 - Train state saved ! 0: INFO 26-04-29 19:35:16.294270 - 3:59:57 - Cleaning up checkpoints... 0: INFO 26-04-29 19:35:16.294469 - 3:59:57 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000020000'), PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000025000')] 0: INFO 26-04-29 19:35:16.294634 - 3:59:57 - Eval folders: [] 0: INFO 26-04-29 19:35:16.294769 - 3:59:57 - Other folders: [] 0: INFO 26-04-29 19:35:16.295362 - 3:59:57 - Removing folders: {PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000020000')} 0: INFO 26-04-29 19:35:20.440832 - 4:00:01 - garbage collection 0: INFO 26-04-29 19:35:34.980469 - 4:00:15 - step: 25010 acc: 0 loss: 1.3503 grad: 1.44e-01 flops: 2.30e+14 wps: 2.67e+04 iter: 0.63 data: 0.0677 lr: 3.72e-05 mem: 54% pow: 647.191 W 0: INFO 26-04-29 19:35:48.875742 - 4:00:29 - step: 25020 acc: 0 loss: 1.3281 grad: 1.40e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.5972 data: 0.0958 lr: 3.72e-05 mem: 47% pow: 654.246 W 0: INFO 26-04-29 19:36:02.755075 - 4:00:43 - step: 25030 acc: 0 loss: 1.4346 grad: 1.50e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6377 data: 0.0739 lr: 3.72e-05 mem: 47% pow: 643.581 W 0: INFO 26-04-29 19:36:16.895649 - 4:00:57 - step: 25040 acc: 0 loss: 1.215 grad: 1.41e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6156 data: 0.0855 lr: 3.71e-05 mem: 47% pow: 650.199 W 0: INFO 26-04-29 19:36:30.649729 - 4:01:11 - step: 25050 acc: 0 loss: 1.2516 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6097 data: 0.0885 lr: 3.71e-05 mem: 47% pow: 645.256 W 0: INFO 26-04-29 19:36:44.529423 - 4:01:25 - step: 25060 acc: 0 loss: 1.2332 grad: 1.52e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6114 data: 0.0884 lr: 3.71e-05 mem: 47% pow: 649.687 W 0: INFO 26-04-29 19:36:58.043194 - 4:01:38 - step: 25070 acc: 0 loss: 1.0544 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.605 data: 0.0772 lr: 3.71e-05 mem: 47% pow: 665.663 W 0: INFO 26-04-29 19:37:11.662932 - 4:01:52 - step: 25080 acc: 0 loss: 1.1752 grad: 1.50e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5888 data: 0.0891 lr: 3.71e-05 mem: 47% pow: 656.727 W 0: INFO 26-04-29 19:37:25.861982 - 4:02:06 - step: 25090 acc: 0 loss: 1.5255 grad: 1.50e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5877 data: 0.0915 lr: 3.71e-05 mem: 47% pow: 656.899 W 0: INFO 26-04-29 19:37:39.701515 - 4:02:20 - step: 25100 acc: 0 loss: 1.8689 grad: 1.51e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6063 data: 0.0907 lr: 3.71e-05 mem: 47% pow: 650.325 W 0: INFO 26-04-29 19:37:56.585597 - 4:02:37 - step: 25110 acc: 0 loss: 1.3813 grad: 1.53e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.5909 data: 0.0907 lr: 3.70e-05 mem: 54% pow: 662.901 W 0: INFO 26-04-29 19:38:10.384826 - 4:02:51 - step: 25120 acc: 0 loss: 1.553 grad: 1.43e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6098 data: 0.0796 lr: 3.70e-05 mem: 47% pow: 660.199 W 0: INFO 26-04-29 19:38:23.950806 - 4:03:04 - step: 25130 acc: 0 loss: 1.2763 grad: 1.42e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6081 data: 0.0884 lr: 3.70e-05 mem: 47% pow: 659.816 W 0: INFO 26-04-29 19:38:37.732238 - 4:03:18 - step: 25140 acc: 0 loss: 1.3531 grad: 1.44e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5849 data: 0.0968 lr: 3.70e-05 mem: 47% pow: 663.51 W 0: INFO 26-04-29 19:38:51.834969 - 4:03:32 - step: 25150 acc: 0 loss: 1.2364 grad: 1.42e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.8344 data: 0.0719 lr: 3.70e-05 mem: 47% pow: 545.797 W 0: INFO 26-04-29 19:39:05.662700 - 4:03:46 - step: 25160 acc: 0 loss: 1.4577 grad: 1.52e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5841 data: 0.0958 lr: 3.70e-05 mem: 47% pow: 662.002 W 0: INFO 26-04-29 19:39:19.656586 - 4:04:00 - step: 25170 acc: 0 loss: 1.4037 grad: 1.45e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5972 data: 0.0866 lr: 3.69e-05 mem: 47% pow: 664.251 W 0: INFO 26-04-29 19:39:33.603480 - 4:04:14 - step: 25180 acc: 0 loss: 1.4067 grad: 1.47e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.674 data: 0.105 lr: 3.69e-05 mem: 47% pow: 605.958 W 0: INFO 26-04-29 19:39:47.202201 - 4:04:27 - step: 25190 acc: 0 loss: 1.4501 grad: 1.44e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6178 data: 0.0983 lr: 3.69e-05 mem: 47% pow: 651.852 W 0: INFO 26-04-29 19:40:01.479816 - 4:04:42 - step: 25200 acc: 0 loss: 1.4777 grad: 1.42e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.5997 data: 0.0888 lr: 3.69e-05 mem: 47% pow: 657.697 W 0: INFO 26-04-29 19:40:18.155934 - 4:04:58 - step: 25210 acc: 0 loss: 1.5416 grad: 1.49e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5778 data: 0.1112 lr: 3.69e-05 mem: 54% pow: 664.387 W 0: INFO 26-04-29 19:40:31.852265 - 4:05:12 - step: 25220 acc: 0 loss: 1.1182 grad: 1.56e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6005 data: 0.0778 lr: 3.69e-05 mem: 47% pow: 659.71 W 0: INFO 26-04-29 19:40:45.604421 - 4:05:26 - step: 25230 acc: 0 loss: 1.2753 grad: 1.50e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5952 data: 0.0867 lr: 3.69e-05 mem: 47% pow: 664.732 W 0: INFO 26-04-29 19:41:00.858240 - 4:05:41 - step: 25240 acc: 0 loss: 1.7585 grad: 1.51e-01 flops: 3.70e+14 wps: 4.30e+04 iter: 0.615 data: 0.0925 lr: 3.68e-05 mem: 47% pow: 652.619 W 0: INFO 26-04-29 19:41:14.767718 - 4:05:55 - step: 25250 acc: 0 loss: 1.5437 grad: 1.40e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6272 data: 0.0755 lr: 3.68e-05 mem: 47% pow: 645.681 W 0: INFO 26-04-29 19:41:28.778482 - 4:06:09 - step: 25260 acc: 0 loss: 1.4769 grad: 1.51e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6062 data: 0.0835 lr: 3.68e-05 mem: 47% pow: 662.368 W 0: INFO 26-04-29 19:41:42.521331 - 4:06:23 - step: 25270 acc: 0 loss: 1.3815 grad: 1.43e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.636 data: 0.0521 lr: 3.68e-05 mem: 47% pow: 667.136 W 0: INFO 26-04-29 19:41:56.504790 - 4:06:37 - step: 25280 acc: 0 loss: 1.2716 grad: 1.51e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6872 data: 0.0914 lr: 3.68e-05 mem: 47% pow: 597.322 W 0: INFO 26-04-29 19:42:10.530534 - 4:06:51 - step: 25290 acc: 0 loss: 1.5317 grad: 1.54e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.5903 data: 0.0918 lr: 3.68e-05 mem: 47% pow: 658.393 W 0: INFO 26-04-29 19:42:24.806129 - 4:07:05 - step: 25300 acc: 0 loss: 1.922 grad: 1.49e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.7354 data: 0.0852 lr: 3.68e-05 mem: 47% pow: 585.611 W 0: INFO 26-04-29 19:42:41.773027 - 4:07:22 - step: 25310 acc: 0 loss: 1.1984 grad: 1.49e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 0.6269 data: 0.0902 lr: 3.67e-05 mem: 54% pow: 659.52 W 0: INFO 26-04-29 19:42:55.654249 - 4:07:36 - step: 25320 acc: 0 loss: 1.4332 grad: 1.55e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5857 data: 0.0855 lr: 3.67e-05 mem: 47% pow: 670.085 W 0: INFO 26-04-29 19:43:09.274121 - 4:07:50 - step: 25330 acc: 0 loss: 1.3498 grad: 1.43e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.612 data: 0.0915 lr: 3.67e-05 mem: 47% pow: 654.929 W 0: INFO 26-04-29 19:43:22.867293 - 4:08:03 - step: 25340 acc: 0 loss: 1.3147 grad: 1.45e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5925 data: 0.0917 lr: 3.67e-05 mem: 47% pow: 663.945 W 0: INFO 26-04-29 19:43:36.626143 - 4:08:17 - step: 25350 acc: 0 loss: 1.349 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6024 data: 0.0821 lr: 3.67e-05 mem: 47% pow: 663.126 W 0: INFO 26-04-29 19:43:50.334037 - 4:08:31 - step: 25360 acc: 0 loss: 1.4264 grad: 1.46e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6153 data: 0.0844 lr: 3.67e-05 mem: 47% pow: 660.974 W 0: INFO 26-04-29 19:44:04.054546 - 4:08:44 - step: 25370 acc: 0 loss: 1.1844 grad: 1.44e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6414 data: 0.091 lr: 3.67e-05 mem: 47% pow: 638.753 W 0: INFO 26-04-29 19:44:18.068435 - 4:08:58 - step: 25380 acc: 0 loss: 1.246 grad: 1.42e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5869 data: 0.096 lr: 3.66e-05 mem: 47% pow: 676.474 W 0: INFO 26-04-29 19:44:31.941655 - 4:09:12 - step: 25390 acc: 0 loss: 1.4473 grad: 1.55e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.624 data: 0.0777 lr: 3.66e-05 mem: 47% pow: 647.095 W 0: INFO 26-04-29 19:44:46.096481 - 4:09:26 - step: 25400 acc: 0 loss: 1.2875 grad: 1.61e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6867 data: 0.0818 lr: 3.66e-05 mem: 47% pow: 615.019 W 0: INFO 26-04-29 19:45:03.247065 - 4:09:44 - step: 25410 acc: 0 loss: 1.5491 grad: 1.51e-01 flops: 3.29e+14 wps: 3.82e+04 iter: 0.5784 data: 0.3059 lr: 3.66e-05 mem: 54% pow: 554.342 W 0: INFO 26-04-29 19:45:17.231648 - 4:09:58 - step: 25420 acc: 0 loss: 1.2448 grad: 1.45e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7599 data: 0.0893 lr: 3.66e-05 mem: 47% pow: 573.78 W 0: INFO 26-04-29 19:45:31.328265 - 4:10:12 - step: 25430 acc: 0 loss: 1.4472 grad: 1.46e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.8108 data: 0.067 lr: 3.66e-05 mem: 47% pow: 554.778 W 0: INFO 26-04-29 19:45:44.950706 - 4:10:25 - step: 25440 acc: 0 loss: 1.3662 grad: 1.46e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6574 data: 0.0904 lr: 3.65e-05 mem: 47% pow: 620.958 W 0: INFO 26-04-29 19:45:58.838090 - 4:10:39 - step: 25450 acc: 0 loss: 1.6902 grad: 1.41e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6141 data: 0.0915 lr: 3.65e-05 mem: 47% pow: 649.124 W 0: INFO 26-04-29 19:46:12.637612 - 4:10:53 - step: 25460 acc: 0 loss: 1.5093 grad: 1.50e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6644 data: 0.0921 lr: 3.65e-05 mem: 47% pow: 617.112 W 0: INFO 26-04-29 19:46:26.217644 - 4:11:07 - step: 25470 acc: 0 loss: 1.2645 grad: 1.41e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6734 data: 0.0754 lr: 3.65e-05 mem: 47% pow: 623.666 W 0: INFO 26-04-29 19:46:40.168996 - 4:11:20 - step: 25480 acc: 0 loss: 1.4271 grad: 1.40e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5992 data: 0.084 lr: 3.65e-05 mem: 47% pow: 661.879 W 0: INFO 26-04-29 19:46:53.900816 - 4:11:34 - step: 25490 acc: 0 loss: 1.3312 grad: 1.47e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6035 data: 0.0843 lr: 3.65e-05 mem: 47% pow: 667.052 W 0: INFO 26-04-29 19:47:07.849614 - 4:11:48 - step: 25500 acc: 0 loss: 1.011 grad: 1.40e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5895 data: 0.0837 lr: 3.65e-05 mem: 47% pow: 681.594 W 0: INFO 26-04-29 19:47:24.393888 - 4:12:05 - step: 25510 acc: 0 loss: 1.6095 grad: 1.45e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.5881 data: 0.0906 lr: 3.64e-05 mem: 54% pow: 666.259 W 0: INFO 26-04-29 19:47:38.129194 - 4:12:18 - step: 25520 acc: 0 loss: 1.2259 grad: 1.45e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6326 data: 0.0876 lr: 3.64e-05 mem: 47% pow: 642.493 W 0: INFO 26-04-29 19:47:51.965528 - 4:12:32 - step: 25530 acc: 0 loss: 1.2414 grad: 1.44e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6126 data: 0.0939 lr: 3.64e-05 mem: 47% pow: 650.663 W 0: INFO 26-04-29 19:48:05.730202 - 4:12:46 - step: 25540 acc: 0 loss: 1.3395 grad: 1.48e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5792 data: 0.1446 lr: 3.64e-05 mem: 47% pow: 633.145 W 0: INFO 26-04-29 19:48:19.645698 - 4:13:00 - step: 25550 acc: 0 loss: 1.6764 grad: 1.48e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5983 data: 0.0867 lr: 3.64e-05 mem: 47% pow: 662.773 W 0: INFO 26-04-29 19:48:33.717545 - 4:13:14 - step: 25560 acc: 0 loss: 1.5082 grad: 1.41e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6425 data: 0.0749 lr: 3.64e-05 mem: 47% pow: 640.435 W 0: INFO 26-04-29 19:48:47.791356 - 4:13:28 - step: 25570 acc: 0 loss: 1.3338 grad: 1.54e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.8954 data: 0.0925 lr: 3.64e-05 mem: 47% pow: 499.689 W 0: INFO 26-04-29 19:49:01.405449 - 4:13:42 - step: 25580 acc: 0 loss: 1.3567 grad: 1.45e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5862 data: 0.0943 lr: 3.63e-05 mem: 47% pow: 659.248 W 0: INFO 26-04-29 19:49:15.122936 - 4:13:55 - step: 25590 acc: 0 loss: 1.702 grad: 1.52e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6097 data: 0.0735 lr: 3.63e-05 mem: 47% pow: 663.193 W 0: INFO 26-04-29 19:49:28.722878 - 4:14:09 - step: 25600 acc: 0 loss: 1.6728 grad: 1.43e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5958 data: 0.0865 lr: 3.63e-05 mem: 47% pow: 673.686 W 0: INFO 26-04-29 19:49:45.733968 - 4:14:26 - step: 25610 acc: 0 loss: 1.2966 grad: 1.65e-01 flops: 3.34e+14 wps: 3.87e+04 iter: 0.7279 data: 0.0841 lr: 3.63e-05 mem: 54% pow: 586.684 W 0: INFO 26-04-29 19:49:59.283681 - 4:14:40 - step: 25620 acc: 0 loss: 1.0721 grad: 1.55e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6039 data: 0.0807 lr: 3.63e-05 mem: 47% pow: 664.37 W 0: INFO 26-04-29 19:50:12.950867 - 4:14:53 - step: 25630 acc: 0 loss: 1.5846 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5974 data: 0.083 lr: 3.63e-05 mem: 47% pow: 661.033 W 0: INFO 26-04-29 19:50:26.696128 - 4:15:07 - step: 25640 acc: 0 loss: 1.5631 grad: 1.64e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6019 data: 0.0767 lr: 3.62e-05 mem: 47% pow: 664.33 W 0: INFO 26-04-29 19:50:40.357252 - 4:15:21 - step: 25650 acc: 0 loss: 1.4666 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6302 data: 0.0866 lr: 3.62e-05 mem: 47% pow: 641.217 W 0: INFO 26-04-29 19:50:54.179359 - 4:15:34 - step: 25660 acc: 0 loss: 1.4082 grad: 1.70e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6235 data: 0.0695 lr: 3.62e-05 mem: 47% pow: 658.523 W 0: INFO 26-04-29 19:51:07.893775 - 4:15:48 - step: 25670 acc: 0 loss: 1.7682 grad: 1.61e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5927 data: 0.0858 lr: 3.62e-05 mem: 47% pow: 665.385 W 0: INFO 26-04-29 19:51:21.567328 - 4:16:02 - step: 25680 acc: 0 loss: 1.3968 grad: 1.57e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5834 data: 0.0951 lr: 3.62e-05 mem: 47% pow: 662.343 W 0: INFO 26-04-29 19:51:35.275811 - 4:16:16 - step: 25690 acc: 0 loss: 1.5167 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6188 data: 0.0909 lr: 3.62e-05 mem: 47% pow: 654.548 W 0: INFO 26-04-29 19:51:49.384669 - 4:16:30 - step: 25700 acc: 0 loss: 1.4005 grad: 1.43e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6165 data: 0.0866 lr: 3.62e-05 mem: 47% pow: 653.644 W 0: INFO 26-04-29 19:52:05.953589 - 4:16:46 - step: 25710 acc: 0 loss: 1.0261 grad: 2.07e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6258 data: 0.0847 lr: 3.61e-05 mem: 54% pow: 639.06 W 0: INFO 26-04-29 19:52:19.557498 - 4:17:00 - step: 25720 acc: 0 loss: 1.4228 grad: 1.81e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.588 data: 0.1096 lr: 3.61e-05 mem: 47% pow: 653.852 W 0: INFO 26-04-29 19:52:33.140693 - 4:17:13 - step: 25730 acc: 0 loss: 1.435 grad: 1.63e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.588 data: 0.0917 lr: 3.61e-05 mem: 47% pow: 654.491 W 0: INFO 26-04-29 19:52:47.141993 - 4:17:27 - step: 25740 acc: 0 loss: 1.4534 grad: 1.58e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6294 data: 0.0885 lr: 3.61e-05 mem: 47% pow: 635.76 W 0: INFO 26-04-29 19:53:00.722431 - 4:17:41 - step: 25750 acc: 0 loss: 1.0088 grad: 1.58e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5868 data: 0.0878 lr: 3.61e-05 mem: 47% pow: 670.341 W 0: INFO 26-04-29 19:53:14.723372 - 4:17:55 - step: 25760 acc: 0 loss: 1.3106 grad: 1.45e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6497 data: 0.0851 lr: 3.61e-05 mem: 47% pow: 636.887 W 0: INFO 26-04-29 19:53:28.453378 - 4:18:09 - step: 25770 acc: 0 loss: 1.5699 grad: 1.58e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.607 data: 0.0889 lr: 3.61e-05 mem: 47% pow: 647.037 W 0: INFO 26-04-29 19:53:42.153823 - 4:18:22 - step: 25780 acc: 0 loss: 1.3469 grad: 1.50e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6063 data: 0.0848 lr: 3.60e-05 mem: 47% pow: 659.593 W 0: INFO 26-04-29 19:53:55.803244 - 4:18:36 - step: 25790 acc: 0 loss: 1.3426 grad: 1.49e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6284 data: 0.0559 lr: 3.60e-05 mem: 47% pow: 663.917 W 0: INFO 26-04-29 19:54:09.136279 - 4:18:49 - step: 25800 acc: 0 loss: 1.2094 grad: 1.57e-01 flops: 4.24e+14 wps: 4.92e+04 iter: 0.5885 data: 0.0897 lr: 3.60e-05 mem: 47% pow: 668.565 W 0: INFO 26-04-29 19:54:25.814009 - 4:19:06 - step: 25810 acc: 0 loss: 1.4372 grad: 1.55e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5819 data: 0.0883 lr: 3.60e-05 mem: 54% pow: 668.761 W 0: INFO 26-04-29 19:54:39.624911 - 4:19:20 - step: 25820 acc: 0 loss: 1.4632 grad: 1.50e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.604 data: 0.1127 lr: 3.60e-05 mem: 47% pow: 639.67 W 0: INFO 26-04-29 19:54:53.458321 - 4:19:34 - step: 25830 acc: 0 loss: 1.3146 grad: 1.49e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7084 data: 0.0883 lr: 3.60e-05 mem: 47% pow: 589.573 W 0: INFO 26-04-29 19:55:07.083597 - 4:19:47 - step: 25840 acc: 0 loss: 1.3667 grad: 1.48e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6838 data: 0.018 lr: 3.60e-05 mem: 47% pow: 651.651 W 0: INFO 26-04-29 19:55:20.690460 - 4:20:01 - step: 25850 acc: 0 loss: 1.2062 grad: 1.72e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5914 data: 0.0824 lr: 3.59e-05 mem: 47% pow: 692.133 W 0: INFO 26-04-29 19:55:34.463054 - 4:20:15 - step: 25860 acc: 0 loss: 1.2687 grad: 1.59e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5869 data: 0.0984 lr: 3.59e-05 mem: 47% pow: 660.619 W 0: INFO 26-04-29 19:55:48.058572 - 4:20:28 - step: 25870 acc: 0 loss: 1.7185 grad: 1.58e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.587 data: 0.0902 lr: 3.59e-05 mem: 47% pow: 664.571 W 0: INFO 26-04-29 19:56:01.523965 - 4:20:42 - step: 25880 acc: 0 loss: 1.3898 grad: 1.52e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6264 data: 0.0585 lr: 3.59e-05 mem: 47% pow: 664.49 W 0: INFO 26-04-29 19:56:15.324650 - 4:20:56 - step: 25890 acc: 0 loss: 1.1302 grad: 1.47e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5942 data: 0.0853 lr: 3.59e-05 mem: 47% pow: 654.651 W 0: INFO 26-04-29 19:56:28.915736 - 4:21:09 - step: 25900 acc: 0 loss: 1.5636 grad: 1.52e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5881 data: 0.0837 lr: 3.59e-05 mem: 47% pow: 661.516 W 0: INFO 26-04-29 19:56:46.542871 - 4:21:27 - step: 25910 acc: 0 loss: 1.7231 grad: 1.57e-01 flops: 3.20e+14 wps: 3.72e+04 iter: 0.6574 data: 0.0873 lr: 3.58e-05 mem: 54% pow: 622.778 W 0: INFO 26-04-29 19:57:00.123719 - 4:21:40 - step: 25920 acc: 0 loss: 1.3887 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5996 data: 0.0867 lr: 3.58e-05 mem: 47% pow: 656.334 W 0: INFO 26-04-29 19:57:13.600459 - 4:21:54 - step: 25930 acc: 0 loss: 1.31 grad: 1.54e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5949 data: 0.0882 lr: 3.58e-05 mem: 47% pow: 662.656 W 0: INFO 26-04-29 19:57:27.130793 - 4:22:07 - step: 25940 acc: 0 loss: 1.2768 grad: 1.69e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5928 data: 0.0877 lr: 3.58e-05 mem: 47% pow: 660.673 W 0: INFO 26-04-29 19:57:41.007320 - 4:22:21 - step: 25950 acc: 0 loss: 1.3944 grad: 1.53e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6025 data: 0.0682 lr: 3.58e-05 mem: 47% pow: 672.71 W 0: INFO 26-04-29 19:57:54.430407 - 4:22:35 - step: 25960 acc: 0 loss: 1.6334 grad: 1.54e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6259 data: 0.0613 lr: 3.58e-05 mem: 47% pow: 666.052 W 0: INFO 26-04-29 19:58:08.118554 - 4:22:48 - step: 25970 acc: 0 loss: 1.6387 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6609 data: 0.089 lr: 3.58e-05 mem: 47% pow: 628.624 W 0: INFO 26-04-29 19:58:21.733782 - 4:23:02 - step: 25980 acc: 0 loss: 1.3227 grad: 1.51e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.599 data: 0.0911 lr: 3.57e-05 mem: 47% pow: 676.873 W 0: INFO 26-04-29 19:58:35.266279 - 4:23:16 - step: 25990 acc: 0 loss: 1.462 grad: 1.65e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5999 data: 0.0796 lr: 3.57e-05 mem: 47% pow: 657.681 W 0: INFO 26-04-29 19:58:49.226386 - 4:23:30 - step: 26000 acc: 0 loss: 1.5217 grad: 1.51e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7704 data: 0.0969 lr: 3.57e-05 mem: 47% pow: 568.635 W 0: INFO 26-04-29 19:58:53.004852 - 4:23:33 - garbage collection 0: INFO 26-04-29 19:59:07.380309 - 4:23:48 - step: 26010 acc: 0 loss: 1.2618 grad: 1.66e-01 flops: 3.11e+14 wps: 3.61e+04 iter: 0.5985 data: 0.0834 lr: 3.57e-05 mem: 54% pow: 664.625 W 0: INFO 26-04-29 19:59:21.235299 - 4:24:02 - step: 26020 acc: 0 loss: 1.3563 grad: 1.52e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.7109 data: 0.0778 lr: 3.57e-05 mem: 47% pow: 617.138 W 0: INFO 26-04-29 19:59:34.824847 - 4:24:15 - step: 26030 acc: 0 loss: 1.4713 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6068 data: 0.0876 lr: 3.57e-05 mem: 47% pow: 655.645 W 0: INFO 26-04-29 19:59:48.520062 - 4:24:29 - step: 26040 acc: 0 loss: 1.2161 grad: 1.46e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5914 data: 0.0882 lr: 3.57e-05 mem: 47% pow: 661.928 W 0: INFO 26-04-29 20:00:02.227288 - 4:24:43 - step: 26050 acc: 0 loss: 1.3471 grad: 1.51e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5858 data: 0.094 lr: 3.56e-05 mem: 47% pow: 655.114 W 0: INFO 26-04-29 20:00:15.928654 - 4:24:56 - step: 26060 acc: 0 loss: 1.4206 grad: 1.66e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5848 data: 0.0877 lr: 3.56e-05 mem: 47% pow: 676.188 W 0: INFO 26-04-29 20:00:29.517255 - 4:25:10 - step: 26070 acc: 0 loss: 1.5883 grad: 1.52e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5862 data: 0.0936 lr: 3.56e-05 mem: 47% pow: 655.573 W 0: INFO 26-04-29 20:00:43.220437 - 4:25:24 - step: 26080 acc: 0 loss: 1.3492 grad: 1.56e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5982 data: 0.0869 lr: 3.56e-05 mem: 47% pow: 663.88 W 0: INFO 26-04-29 20:00:57.041087 - 4:25:37 - step: 26090 acc: 0 loss: 1.2907 grad: 1.57e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6284 data: 0.074 lr: 3.56e-05 mem: 47% pow: 650.41 W 0: INFO 26-04-29 20:01:10.823292 - 4:25:51 - step: 26100 acc: 0 loss: 1.6237 grad: 1.52e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5983 data: 0.079 lr: 3.56e-05 mem: 47% pow: 656.539 W 0: INFO 26-04-29 20:01:27.404563 - 4:26:08 - step: 26110 acc: 0 loss: 1.2707 grad: 1.46e-01 flops: 3.41e+14 wps: 3.95e+04 iter: 0.6213 data: 0.0784 lr: 3.55e-05 mem: 54% pow: 660.184 W 0: INFO 26-04-29 20:01:41.415184 - 4:26:22 - step: 26120 acc: 0 loss: 1.6269 grad: 1.70e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.7401 data: 0.0834 lr: 3.55e-05 mem: 47% pow: 590.468 W 0: INFO 26-04-29 20:01:55.017364 - 4:26:35 - step: 26130 acc: 0 loss: 1.4364 grad: 1.58e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5913 data: 0.1001 lr: 3.55e-05 mem: 47% pow: 668.038 W 0: INFO 26-04-29 20:02:08.839711 - 4:26:49 - step: 26140 acc: 0 loss: 1.3618 grad: 1.55e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6043 data: 0.0917 lr: 3.55e-05 mem: 47% pow: 654.753 W 0: INFO 26-04-29 20:02:22.499597 - 4:27:03 - step: 26150 acc: 0 loss: 1.3206 grad: 1.77e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5886 data: 0.0908 lr: 3.55e-05 mem: 47% pow: 663.823 W 0: INFO 26-04-29 20:02:36.114036 - 4:27:16 - step: 26160 acc: 0 loss: 1.6162 grad: 2.61e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6651 data: 0.0896 lr: 3.55e-05 mem: 47% pow: 614.533 W 0: INFO 26-04-29 20:02:50.096468 - 4:27:30 - step: 26170 acc: 0 loss: 1.3604 grad: 1.69e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5812 data: 0.1323 lr: 3.55e-05 mem: 47% pow: 646.023 W 0: INFO 26-04-29 20:03:03.634283 - 4:27:44 - step: 26180 acc: 0 loss: 1.2333 grad: 1.67e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6285 data: 0.088 lr: 3.54e-05 mem: 47% pow: 637.188 W 0: INFO 26-04-29 20:03:17.475414 - 4:27:58 - step: 26190 acc: 0 loss: 1.1617 grad: 1.61e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6046 data: 0.0884 lr: 3.54e-05 mem: 47% pow: 656.574 W 0: INFO 26-04-29 20:03:30.966243 - 4:28:11 - step: 26200 acc: 0 loss: 1.1945 grad: 1.66e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6137 data: 0.0693 lr: 3.54e-05 mem: 47% pow: 665.47 W 0: INFO 26-04-29 20:03:47.781481 - 4:28:28 - step: 26210 acc: 0 loss: 1.4114 grad: 1.61e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6125 data: 0.0761 lr: 3.54e-05 mem: 54% pow: 669.422 W 0: INFO 26-04-29 20:04:01.733734 - 4:28:42 - step: 26220 acc: 0 loss: 1.6078 grad: 1.66e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7043 data: 0.0916 lr: 3.54e-05 mem: 47% pow: 596.076 W 0: INFO 26-04-29 20:04:15.522225 - 4:28:56 - step: 26230 acc: 0 loss: 1.0883 grad: 1.52e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.7954 data: 0.0849 lr: 3.54e-05 mem: 47% pow: 552.211 W 0: INFO 26-04-29 20:04:29.154782 - 4:29:09 - step: 26240 acc: 0 loss: 1.4249 grad: 1.73e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6092 data: 0.0873 lr: 3.54e-05 mem: 47% pow: 650.75 W 0: INFO 26-04-29 20:04:42.965528 - 4:29:23 - step: 26250 acc: 0 loss: 1.7438 grad: 1.57e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.62 data: 0.0866 lr: 3.53e-05 mem: 47% pow: 655.763 W 0: INFO 26-04-29 20:04:56.581230 - 4:29:37 - step: 26260 acc: 0 loss: 1.3189 grad: 1.56e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6655 data: 0.0881 lr: 3.53e-05 mem: 47% pow: 631.211 W 0: INFO 26-04-29 20:05:10.435786 - 4:29:51 - step: 26270 acc: 0 loss: 1.7533 grad: 1.70e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5831 data: 0.0946 lr: 3.53e-05 mem: 47% pow: 663.596 W 0: INFO 26-04-29 20:05:24.002315 - 4:30:04 - step: 26280 acc: 0 loss: 1.1713 grad: 1.72e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6187 data: 0.0764 lr: 3.53e-05 mem: 47% pow: 648.289 W 0: INFO 26-04-29 20:05:37.882926 - 4:30:18 - step: 26290 acc: 0 loss: 1.497 grad: 1.65e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6079 data: 0.0888 lr: 3.53e-05 mem: 47% pow: 651.876 W 0: INFO 26-04-29 20:05:51.612712 - 4:30:32 - step: 26300 acc: 0 loss: 1.4513 grad: 1.60e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6103 data: 0.1018 lr: 3.53e-05 mem: 47% pow: 666.572 W 0: INFO 26-04-29 20:06:08.463341 - 4:30:49 - step: 26310 acc: 0 loss: 1.4777 grad: 1.77e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6237 data: 0.0826 lr: 3.53e-05 mem: 54% pow: 649.81 W 0: INFO 26-04-29 20:06:22.185528 - 4:31:02 - step: 26320 acc: 0 loss: 1.0869 grad: 1.61e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6033 data: 0.0816 lr: 3.52e-05 mem: 47% pow: 666.082 W 0: INFO 26-04-29 20:06:35.980639 - 4:31:16 - step: 26330 acc: 0 loss: 1.0925 grad: 1.57e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5997 data: 0.0843 lr: 3.52e-05 mem: 47% pow: 660.709 W 0: INFO 26-04-29 20:06:49.396659 - 4:31:30 - step: 26340 acc: 0 loss: 1.1452 grad: 1.56e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6008 data: 0.0791 lr: 3.52e-05 mem: 47% pow: 656.758 W 0: INFO 26-04-29 20:07:03.094082 - 4:31:43 - step: 26350 acc: 0 loss: 1.2831 grad: 1.64e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6405 data: 0.086 lr: 3.52e-05 mem: 47% pow: 632.567 W 0: INFO 26-04-29 20:07:16.824512 - 4:31:57 - step: 26360 acc: 0 loss: 1.328 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6431 data: 0.084 lr: 3.52e-05 mem: 47% pow: 640.765 W 0: INFO 26-04-29 20:07:30.385897 - 4:32:11 - step: 26370 acc: 0 loss: 1.3076 grad: 1.57e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5985 data: 0.0856 lr: 3.52e-05 mem: 47% pow: 664.481 W 0: INFO 26-04-29 20:07:43.882006 - 4:32:24 - step: 26380 acc: 0 loss: 1.4724 grad: 1.68e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5905 data: 0.0876 lr: 3.51e-05 mem: 47% pow: 667.305 W 0: INFO 26-04-29 20:07:57.590713 - 4:32:38 - step: 26390 acc: 0 loss: 1.2865 grad: 1.64e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5803 data: 0.1312 lr: 3.51e-05 mem: 47% pow: 659.039 W 0: INFO 26-04-29 20:08:11.407399 - 4:32:52 - step: 26400 acc: 0 loss: 1.2369 grad: 1.66e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6118 data: 0.0861 lr: 3.51e-05 mem: 47% pow: 672.954 W 0: INFO 26-04-29 20:08:27.827142 - 4:33:08 - step: 26410 acc: 0 loss: 1.5349 grad: 1.65e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.6199 data: 0.0867 lr: 3.51e-05 mem: 54% pow: 646.5 W 0: INFO 26-04-29 20:08:41.471723 - 4:33:22 - step: 26420 acc: 0 loss: 1.2741 grad: 1.58e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6013 data: 0.0893 lr: 3.51e-05 mem: 47% pow: 656.643 W 0: INFO 26-04-29 20:08:55.152009 - 4:33:35 - step: 26430 acc: 0 loss: 1.0891 grad: 1.64e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5895 data: 0.0856 lr: 3.51e-05 mem: 47% pow: 661.918 W 0: INFO 26-04-29 20:09:09.304245 - 4:33:50 - step: 26440 acc: 0 loss: 1.4618 grad: 1.66e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6351 data: 0.0792 lr: 3.51e-05 mem: 47% pow: 643.71 W 0: INFO 26-04-29 20:09:23.127320 - 4:34:03 - step: 26450 acc: 0 loss: 1.5602 grad: 1.65e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5809 data: 0.0851 lr: 3.50e-05 mem: 47% pow: 677.08 W 0: INFO 26-04-29 20:09:36.695743 - 4:34:17 - step: 26460 acc: 0 loss: 1.2031 grad: 1.59e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6067 data: 0.0904 lr: 3.50e-05 mem: 47% pow: 643.942 W 0: INFO 26-04-29 20:09:50.327385 - 4:34:31 - step: 26470 acc: 0 loss: 1.1239 grad: 1.67e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6118 data: 0.0875 lr: 3.50e-05 mem: 47% pow: 642.647 W 0: INFO 26-04-29 20:10:04.418827 - 4:34:45 - step: 26480 acc: 0 loss: 1.1899 grad: 2.18e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6485 data: 0.0813 lr: 3.50e-05 mem: 47% pow: 630.906 W 0: INFO 26-04-29 20:10:18.021613 - 4:34:58 - step: 26490 acc: 0 loss: 1.129 grad: 1.62e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6205 data: 0.1041 lr: 3.50e-05 mem: 47% pow: 633.843 W 0: INFO 26-04-29 20:10:31.594701 - 4:35:12 - step: 26500 acc: 0 loss: 1.3537 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6321 data: 0.0757 lr: 3.50e-05 mem: 47% pow: 653.445 W 0: INFO 26-04-29 20:10:48.214513 - 4:35:29 - step: 26510 acc: 0 loss: 1.1906 grad: 1.81e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6337 data: 0.0809 lr: 3.50e-05 mem: 54% pow: 643.466 W 0: INFO 26-04-29 20:11:01.687810 - 4:35:42 - step: 26520 acc: 0 loss: 1.3233 grad: 1.62e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6231 data: 0.0862 lr: 3.49e-05 mem: 47% pow: 642.286 W 0: INFO 26-04-29 20:11:15.334028 - 4:35:56 - step: 26530 acc: 0 loss: 1.1771 grad: 1.53e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5957 data: 0.0863 lr: 3.49e-05 mem: 47% pow: 660.607 W 0: INFO 26-04-29 20:11:29.093125 - 4:36:09 - step: 26540 acc: 0 loss: 1.1608 grad: 1.65e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6061 data: 0.0812 lr: 3.49e-05 mem: 47% pow: 669.659 W 0: INFO 26-04-29 20:11:42.677885 - 4:36:23 - step: 26550 acc: 0 loss: 1.5204 grad: 1.59e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6093 data: 0.0692 lr: 3.49e-05 mem: 47% pow: 660.543 W 0: INFO 26-04-29 20:11:56.395438 - 4:36:37 - step: 26560 acc: 0 loss: 1.4767 grad: 1.58e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5855 data: 0.083 lr: 3.49e-05 mem: 47% pow: 663.524 W 0: INFO 26-04-29 20:12:10.541958 - 4:36:51 - step: 26570 acc: 0 loss: 1.3651 grad: 1.85e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6127 data: 0.085 lr: 3.49e-05 mem: 47% pow: 653.486 W 0: INFO 26-04-29 20:12:24.181253 - 4:37:04 - step: 26580 acc: 0 loss: 1.1535 grad: 1.62e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6092 data: 0.094 lr: 3.49e-05 mem: 47% pow: 645.775 W 0: INFO 26-04-29 20:12:38.178680 - 4:37:18 - step: 26590 acc: 0 loss: 1.2869 grad: 6.31e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6025 data: 0.0926 lr: 3.48e-05 mem: 47% pow: 658.185 W 0: INFO 26-04-29 20:12:51.919401 - 4:37:32 - step: 26600 acc: 0 loss: 1.1841 grad: 1.60e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.593 data: 0.0908 lr: 3.48e-05 mem: 47% pow: 665.736 W 0: INFO 26-04-29 20:13:08.559656 - 4:37:49 - step: 26610 acc: 0 loss: 1.4956 grad: 1.60e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6167 data: 0.0897 lr: 3.48e-05 mem: 54% pow: 646.873 W 0: INFO 26-04-29 20:13:22.169569 - 4:38:02 - step: 26620 acc: 0 loss: 1.3986 grad: 1.58e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.626 data: 0.0765 lr: 3.48e-05 mem: 47% pow: 648.311 W 0: INFO 26-04-29 20:13:35.954735 - 4:38:16 - step: 26630 acc: 0 loss: 1.4796 grad: 2.34e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5778 data: 0.0992 lr: 3.48e-05 mem: 47% pow: 661.575 W 0: INFO 26-04-29 20:13:49.557578 - 4:38:30 - step: 26640 acc: 0 loss: 1.3446 grad: 1.73e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5908 data: 0.0884 lr: 3.48e-05 mem: 47% pow: 659.932 W 0: INFO 26-04-29 20:14:03.367002 - 4:38:44 - step: 26650 acc: 0 loss: 1.3071 grad: 1.69e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6056 data: 0.0836 lr: 3.47e-05 mem: 47% pow: 658.29 W 0: INFO 26-04-29 20:14:17.049395 - 4:38:57 - step: 26660 acc: 0 loss: 1.2634 grad: 1.71e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.581 data: 0.1027 lr: 3.47e-05 mem: 47% pow: 656.932 W 0: INFO 26-04-29 20:14:30.753477 - 4:39:11 - step: 26670 acc: 0 loss: 1.3257 grad: 1.67e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7386 data: 0.0765 lr: 3.47e-05 mem: 47% pow: 585.736 W 0: INFO 26-04-29 20:14:44.256334 - 4:39:25 - step: 26680 acc: 0 loss: 1.2947 grad: 1.82e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6035 data: 0.0839 lr: 3.47e-05 mem: 47% pow: 654.013 W 0: INFO 26-04-29 20:14:57.911710 - 4:39:38 - step: 26690 acc: 0 loss: 1.2101 grad: 1.66e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6615 data: 0.0912 lr: 3.47e-05 mem: 47% pow: 626.885 W 0: INFO 26-04-29 20:15:11.337288 - 4:39:52 - step: 26700 acc: 0 loss: 1.4144 grad: 1.65e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.59 data: 0.0891 lr: 3.47e-05 mem: 47% pow: 655.445 W 0: INFO 26-04-29 20:15:27.997530 - 4:40:08 - step: 26710 acc: 0 loss: 1.2856 grad: 1.63e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6888 data: 0.0795 lr: 3.47e-05 mem: 54% pow: 613.534 W 0: INFO 26-04-29 20:15:41.638824 - 4:40:22 - step: 26720 acc: 0 loss: 1.566 grad: 1.69e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5907 data: 0.0896 lr: 3.46e-05 mem: 47% pow: 660.532 W 0: INFO 26-04-29 20:15:55.368913 - 4:40:36 - step: 26730 acc: 0 loss: 1.5775 grad: 1.66e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6137 data: 0.0755 lr: 3.46e-05 mem: 47% pow: 654.852 W 0: INFO 26-04-29 20:16:08.945782 - 4:40:49 - step: 26740 acc: 0 loss: 1.4694 grad: 1.74e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6171 data: 0.0872 lr: 3.46e-05 mem: 47% pow: 647.185 W 0: INFO 26-04-29 20:16:22.536029 - 4:41:03 - step: 26750 acc: 0 loss: 1.7801 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5901 data: 0.0889 lr: 3.46e-05 mem: 47% pow: 663.173 W 0: INFO 26-04-29 20:16:36.212485 - 4:41:17 - step: 26760 acc: 0 loss: 1.4718 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5976 data: 0.0954 lr: 3.46e-05 mem: 47% pow: 659.94 W 0: INFO 26-04-29 20:16:49.755618 - 4:41:30 - step: 26770 acc: 0 loss: 1.3263 grad: 1.71e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5856 data: 0.087 lr: 3.46e-05 mem: 47% pow: 674.063 W 0: INFO 26-04-29 20:17:03.478462 - 4:41:44 - step: 26780 acc: 0 loss: 1.5476 grad: 1.81e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6278 data: 0.0913 lr: 3.46e-05 mem: 47% pow: 636.507 W 0: INFO 26-04-29 20:17:16.895847 - 4:41:57 - step: 26790 acc: 0 loss: 1.1144 grad: 1.58e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5912 data: 0.086 lr: 3.45e-05 mem: 47% pow: 667.035 W 0: INFO 26-04-29 20:17:30.445420 - 4:42:11 - step: 26800 acc: 0 loss: 1.3188 grad: 1.63e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6698 data: 0.0658 lr: 3.45e-05 mem: 47% pow: 626.76 W 0: INFO 26-04-29 20:17:46.896134 - 4:42:27 - step: 26810 acc: 0 loss: 1.1677 grad: 1.66e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5918 data: 0.0836 lr: 3.45e-05 mem: 54% pow: 666.625 W 0: INFO 26-04-29 20:18:00.601755 - 4:42:41 - step: 26820 acc: 0 loss: 1.1665 grad: 1.56e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5987 data: 0.0771 lr: 3.45e-05 mem: 47% pow: 658.063 W 0: INFO 26-04-29 20:18:14.141231 - 4:42:54 - step: 26830 acc: 0 loss: 1.7633 grad: 1.58e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5818 data: 0.096 lr: 3.45e-05 mem: 47% pow: 663.729 W 0: INFO 26-04-29 20:18:27.545265 - 4:43:08 - step: 26840 acc: 0 loss: 1.1757 grad: 1.57e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5921 data: 0.087 lr: 3.45e-05 mem: 47% pow: 657.256 W 0: INFO 26-04-29 20:18:41.102435 - 4:43:21 - step: 26850 acc: 0 loss: 1.3564 grad: 1.57e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5986 data: 0.083 lr: 3.44e-05 mem: 47% pow: 658.241 W 0: INFO 26-04-29 20:18:54.656810 - 4:43:35 - step: 26860 acc: 0 loss: 1.2515 grad: 1.56e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6217 data: 0.0841 lr: 3.44e-05 mem: 47% pow: 651.673 W 0: INFO 26-04-29 20:19:08.209332 - 4:43:49 - step: 26870 acc: 0 loss: 1.4028 grad: 1.74e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6163 data: 0.0802 lr: 3.44e-05 mem: 47% pow: 662.669 W 0: INFO 26-04-29 20:19:21.791889 - 4:44:02 - step: 26880 acc: 0 loss: 1.255 grad: 1.61e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5824 data: 0.088 lr: 3.44e-05 mem: 47% pow: 670.441 W 0: INFO 26-04-29 20:19:35.282178 - 4:44:16 - step: 26890 acc: 0 loss: 1.2312 grad: 1.58e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6158 data: 0.0905 lr: 3.44e-05 mem: 47% pow: 648.393 W 0: INFO 26-04-29 20:19:48.854840 - 4:44:29 - step: 26900 acc: 0 loss: 0.9775 grad: 1.82e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6444 data: 0.0658 lr: 3.44e-05 mem: 47% pow: 658.776 W 0: INFO 26-04-29 20:20:05.545911 - 4:44:46 - step: 26910 acc: 0 loss: 1.4731 grad: 1.67e-01 flops: 3.38e+14 wps: 3.93e+04 iter: 0.6103 data: 0.1115 lr: 3.44e-05 mem: 54% pow: 633.495 W 0: INFO 26-04-29 20:20:19.562810 - 4:45:00 - step: 26920 acc: 0 loss: 1.3143 grad: 1.57e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6903 data: 0.0836 lr: 3.43e-05 mem: 47% pow: 609.6 W 0: INFO 26-04-29 20:20:33.665900 - 4:45:14 - step: 26930 acc: 0 loss: 1.3896 grad: 1.63e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6485 data: 0.087 lr: 3.43e-05 mem: 47% pow: 632.097 W 0: INFO 26-04-29 20:20:47.378859 - 4:45:28 - step: 26940 acc: 0 loss: 1.1631 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6924 data: 0.0824 lr: 3.43e-05 mem: 47% pow: 609.198 W 0: INFO 26-04-29 20:21:00.869443 - 4:45:41 - step: 26950 acc: 0 loss: 1.4602 grad: 1.55e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5987 data: 0.0825 lr: 3.43e-05 mem: 47% pow: 667.753 W 0: INFO 26-04-29 20:21:14.473397 - 4:45:55 - step: 26960 acc: 0 loss: 1.6692 grad: 1.51e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5904 data: 0.0876 lr: 3.43e-05 mem: 47% pow: 691.433 W 0: INFO 26-04-29 20:21:28.013285 - 4:46:08 - step: 26970 acc: 0 loss: 1.0294 grad: 1.54e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5914 data: 0.0992 lr: 3.43e-05 mem: 47% pow: 664.733 W 0: INFO 26-04-29 20:21:41.533565 - 4:46:22 - step: 26980 acc: 0 loss: 1.4862 grad: 1.51e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5985 data: 0.0791 lr: 3.43e-05 mem: 47% pow: 662.09 W 0: INFO 26-04-29 20:21:55.338227 - 4:46:36 - step: 26990 acc: 0 loss: 1.3455 grad: 1.61e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5925 data: 0.0885 lr: 3.42e-05 mem: 47% pow: 654.053 W 0: INFO 26-04-29 20:22:09.141289 - 4:46:49 - step: 27000 acc: 0 loss: 1.3405 grad: 1.71e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6083 data: 0.0899 lr: 3.42e-05 mem: 47% pow: 650.829 W 0: INFO 26-04-29 20:22:12.872838 - 4:46:53 - garbage collection 0: INFO 26-04-29 20:22:27.406602 - 4:47:08 - step: 27010 acc: 0 loss: 1.3537 grad: 1.61e-01 flops: 3.09e+14 wps: 3.59e+04 iter: 0.5991 data: 0.0861 lr: 3.42e-05 mem: 54% pow: 660.755 W 0: INFO 26-04-29 20:22:40.945736 - 4:47:21 - step: 27020 acc: 0 loss: 1.2706 grad: 1.56e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.604 data: 0.0902 lr: 3.42e-05 mem: 47% pow: 660.212 W 0: INFO 26-04-29 20:22:54.561270 - 4:47:35 - step: 27030 acc: 0 loss: 1.5335 grad: 1.58e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6025 data: 0.0805 lr: 3.42e-05 mem: 47% pow: 680.78 W 0: INFO 26-04-29 20:23:08.314173 - 4:47:49 - step: 27040 acc: 0 loss: 1.1621 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6297 data: 0.0896 lr: 3.42e-05 mem: 47% pow: 654.397 W 0: INFO 26-04-29 20:23:21.798413 - 4:48:02 - step: 27050 acc: 0 loss: 1.3381 grad: 1.61e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6006 data: 0.091 lr: 3.42e-05 mem: 47% pow: 654.096 W 0: INFO 26-04-29 20:23:35.395003 - 4:48:16 - step: 27060 acc: 0 loss: 1.4586 grad: 1.54e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6476 data: 0.086 lr: 3.41e-05 mem: 47% pow: 650.1 W 0: INFO 26-04-29 20:23:49.607578 - 4:48:30 - step: 27070 acc: 0 loss: 1.1529 grad: 1.55e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.6083 data: 0.0879 lr: 3.41e-05 mem: 47% pow: 661.495 W 0: INFO 26-04-29 20:24:03.494400 - 4:48:44 - step: 27080 acc: 0 loss: 1.3543 grad: 1.69e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6062 data: 0.094 lr: 3.41e-05 mem: 47% pow: 652.837 W 0: INFO 26-04-29 20:24:17.061756 - 4:48:57 - step: 27090 acc: 0 loss: 1.2793 grad: 1.52e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6237 data: 0.0908 lr: 3.41e-05 mem: 47% pow: 633.338 W 0: INFO 26-04-29 20:24:30.688231 - 4:49:11 - step: 27100 acc: 0 loss: 1.3272 grad: 1.62e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5995 data: 0.0945 lr: 3.41e-05 mem: 47% pow: 655.789 W 0: INFO 26-04-29 20:24:47.235000 - 4:49:28 - step: 27110 acc: 0 loss: 1.3689 grad: 1.58e-01 flops: 3.42e+14 wps: 3.96e+04 iter: 0.6026 data: 0.0975 lr: 3.41e-05 mem: 54% pow: 648.417 W 0: INFO 26-04-29 20:25:00.919878 - 4:49:41 - step: 27120 acc: 0 loss: 1.4336 grad: 1.50e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5938 data: 0.0972 lr: 3.40e-05 mem: 47% pow: 670.531 W 0: INFO 26-04-29 20:25:14.628612 - 4:49:55 - step: 27130 acc: 0 loss: 1.1277 grad: 1.63e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.656 data: 0.0372 lr: 3.40e-05 mem: 47% pow: 662.585 W 0: INFO 26-04-29 20:25:28.353673 - 4:50:09 - step: 27140 acc: 0 loss: 1.2799 grad: 2.01e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.5792 data: 0.1257 lr: 3.40e-05 mem: 47% pow: 650.758 W 0: INFO 26-04-29 20:25:41.890994 - 4:50:22 - step: 27150 acc: 0 loss: 1.5425 grad: 2.32e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5921 data: 0.0906 lr: 3.40e-05 mem: 47% pow: 658.911 W 0: INFO 26-04-29 20:25:55.548447 - 4:50:36 - step: 27160 acc: 0 loss: 1.4748 grad: 2.19e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6231 data: 0.0898 lr: 3.40e-05 mem: 47% pow: 656.46 W 0: INFO 26-04-29 20:26:09.352602 - 4:50:50 - step: 27170 acc: 0 loss: 1.4461 grad: 1.63e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5836 data: 0.0933 lr: 3.40e-05 mem: 47% pow: 658.535 W 0: INFO 26-04-29 20:26:23.055504 - 4:51:03 - step: 27180 acc: 0 loss: 1.369 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6967 data: 0.0916 lr: 3.40e-05 mem: 47% pow: 605.638 W 0: INFO 26-04-29 20:26:38.345248 - 4:51:19 - step: 27190 acc: 0 loss: 1.4728 grad: 1.56e-01 flops: 3.70e+14 wps: 4.29e+04 iter: 0.6182 data: 0.0895 lr: 3.39e-05 mem: 47% pow: 646.126 W 0: INFO 26-04-29 20:26:51.939153 - 4:51:32 - step: 27200 acc: 0 loss: 1.2833 grad: 1.58e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5925 data: 0.0928 lr: 3.39e-05 mem: 47% pow: 666.849 W 0: INFO 26-04-29 20:27:08.558343 - 4:51:49 - step: 27210 acc: 0 loss: 1.4107 grad: 1.57e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.5902 data: 0.0937 lr: 3.39e-05 mem: 54% pow: 672.365 W 0: INFO 26-04-29 20:27:22.044661 - 4:52:02 - step: 27220 acc: 0 loss: 1.2691 grad: 1.61e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6064 data: 0.0826 lr: 3.39e-05 mem: 47% pow: 658.05 W 0: INFO 26-04-29 20:27:35.756577 - 4:52:16 - step: 27230 acc: 0 loss: 1.4746 grad: 1.67e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5992 data: 0.0903 lr: 3.39e-05 mem: 47% pow: 661.73 W 0: INFO 26-04-29 20:27:49.311807 - 4:52:30 - step: 27240 acc: 0 loss: 1.1824 grad: 1.56e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6384 data: 0.0841 lr: 3.39e-05 mem: 47% pow: 635.13 W 0: INFO 26-04-29 20:28:03.035801 - 4:52:43 - step: 27250 acc: 0 loss: 1.1291 grad: 1.70e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.612 data: 0.1032 lr: 3.39e-05 mem: 47% pow: 643.721 W 0: INFO 26-04-29 20:28:16.573991 - 4:52:57 - step: 27260 acc: 0 loss: 1.4116 grad: 1.59e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6121 data: 0.0939 lr: 3.38e-05 mem: 47% pow: 651.951 W 0: INFO 26-04-29 20:28:30.272111 - 4:53:11 - step: 27270 acc: 0 loss: 1.4942 grad: 1.62e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6468 data: 0.098 lr: 3.38e-05 mem: 47% pow: 621.062 W 0: INFO 26-04-29 20:28:44.068726 - 4:53:24 - step: 27280 acc: 0 loss: 1.5306 grad: 1.57e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.657 data: 0.079 lr: 3.38e-05 mem: 47% pow: 627.521 W 0: INFO 26-04-29 20:28:57.481834 - 4:53:38 - step: 27290 acc: 0 loss: 1.1364 grad: 1.56e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6051 data: 0.0812 lr: 3.38e-05 mem: 47% pow: 667.698 W 0: INFO 26-04-29 20:29:11.214882 - 4:53:52 - step: 27300 acc: 0 loss: 1.1859 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6008 data: 0.085 lr: 3.38e-05 mem: 47% pow: 660.768 W 0: INFO 26-04-29 20:29:27.894790 - 4:54:08 - step: 27310 acc: 0 loss: 1.2112 grad: 1.56e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5834 data: 0.0872 lr: 3.38e-05 mem: 54% pow: 670.932 W 0: INFO 26-04-29 20:29:41.520141 - 4:54:22 - step: 27320 acc: 0 loss: 1.2674 grad: 1.53e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.7067 data: 0.0819 lr: 3.37e-05 mem: 47% pow: 611.076 W 0: INFO 26-04-29 20:29:55.246183 - 4:54:36 - step: 27330 acc: 0 loss: 1.3821 grad: 1.62e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6505 data: 0.0667 lr: 3.37e-05 mem: 47% pow: 635.522 W 0: INFO 26-04-29 20:30:08.828918 - 4:54:49 - step: 27340 acc: 0 loss: 1.0749 grad: 1.61e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.581 data: 0.0907 lr: 3.37e-05 mem: 47% pow: 675.465 W 0: INFO 26-04-29 20:30:22.715073 - 4:55:03 - step: 27350 acc: 0 loss: 1.4522 grad: 1.62e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5776 data: 0.1057 lr: 3.37e-05 mem: 47% pow: 661.026 W 0: INFO 26-04-29 20:30:36.521861 - 4:55:17 - step: 27360 acc: 0 loss: 1.3227 grad: 1.88e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6064 data: 0.0863 lr: 3.37e-05 mem: 47% pow: 659.427 W 0: INFO 26-04-29 20:30:50.374611 - 4:55:31 - step: 27370 acc: 0 loss: 1.0153 grad: 1.69e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5858 data: 0.0908 lr: 3.37e-05 mem: 47% pow: 666.026 W 0: INFO 26-04-29 20:31:04.323959 - 4:55:45 - step: 27380 acc: 0 loss: 1.392 grad: 1.53e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5952 data: 0.0896 lr: 3.37e-05 mem: 47% pow: 662.763 W 0: INFO 26-04-29 20:31:18.061079 - 4:55:58 - step: 27390 acc: 0 loss: 1.3079 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5932 data: 0.0962 lr: 3.36e-05 mem: 47% pow: 658.858 W 0: INFO 26-04-29 20:31:31.631681 - 4:56:12 - step: 27400 acc: 0 loss: 1.1685 grad: 1.61e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5983 data: 0.1134 lr: 3.36e-05 mem: 47% pow: 660.803 W 0: INFO 26-04-29 20:31:48.407700 - 4:56:29 - step: 27410 acc: 0 loss: 1.3117 grad: 1.57e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.5852 data: 0.0925 lr: 3.36e-05 mem: 54% pow: 667.042 W 0: INFO 26-04-29 20:32:02.100669 - 4:56:42 - step: 27420 acc: 0 loss: 1.2024 grad: 1.56e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.594 data: 0.0892 lr: 3.36e-05 mem: 47% pow: 658.56 W 0: INFO 26-04-29 20:32:15.933444 - 4:56:56 - step: 27430 acc: 0 loss: 1.3026 grad: 1.56e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.636 data: 0.061 lr: 3.36e-05 mem: 47% pow: 662.906 W 0: INFO 26-04-29 20:32:29.535402 - 4:57:10 - step: 27440 acc: 0 loss: 1.1777 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5786 data: 0.1069 lr: 3.36e-05 mem: 47% pow: 661.587 W 0: INFO 26-04-29 20:32:43.242813 - 4:57:24 - step: 27450 acc: 0 loss: 1.2011 grad: 1.57e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6174 data: 0.0892 lr: 3.36e-05 mem: 47% pow: 651.227 W 0: INFO 26-04-29 20:32:57.006829 - 4:57:37 - step: 27460 acc: 0 loss: 1.5506 grad: 1.63e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6057 data: 0.092 lr: 3.35e-05 mem: 47% pow: 658.9 W 0: INFO 26-04-29 20:33:10.738685 - 4:57:51 - step: 27470 acc: 0 loss: 1.1129 grad: 1.60e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6016 data: 0.0931 lr: 3.35e-05 mem: 47% pow: 667.229 W 0: INFO 26-04-29 20:33:24.413898 - 4:58:05 - step: 27480 acc: 0 loss: 1.2566 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.602 data: 0.0816 lr: 3.35e-05 mem: 47% pow: 661.607 W 0: INFO 26-04-29 20:33:38.011422 - 4:58:18 - step: 27490 acc: 0 loss: 1.1495 grad: 1.60e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6303 data: 0.0852 lr: 3.35e-05 mem: 47% pow: 633.393 W 0: INFO 26-04-29 20:33:51.867804 - 4:58:32 - step: 27500 acc: 0 loss: 1.4663 grad: 1.58e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6133 data: 0.084 lr: 3.35e-05 mem: 47% pow: 642.176 W 0: INFO 26-04-29 20:34:08.815618 - 4:58:49 - step: 27510 acc: 0 loss: 1.1354 grad: 1.55e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.5949 data: 0.0883 lr: 3.35e-05 mem: 54% pow: 666.975 W 0: INFO 26-04-29 20:34:22.533572 - 4:59:03 - step: 27520 acc: 0 loss: 1.1081 grad: 1.62e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5865 data: 0.089 lr: 3.35e-05 mem: 47% pow: 667.171 W 0: INFO 26-04-29 20:34:36.294542 - 4:59:17 - step: 27530 acc: 0 loss: 1.4892 grad: 1.64e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6353 data: 0.0893 lr: 3.34e-05 mem: 47% pow: 629.529 W 0: INFO 26-04-29 20:34:50.362689 - 4:59:31 - step: 27540 acc: 0 loss: 1.0275 grad: 1.82e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.5885 data: 0.0895 lr: 3.34e-05 mem: 47% pow: 655.187 W 0: INFO 26-04-29 20:35:04.195927 - 4:59:44 - step: 27550 acc: 0 loss: 1.2066 grad: 1.52e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6076 data: 0.09 lr: 3.34e-05 mem: 47% pow: 662.197 W 0: INFO 26-04-29 20:35:17.950241 - 4:59:58 - step: 27560 acc: 0 loss: 1.3677 grad: 1.54e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6033 data: 0.0877 lr: 3.34e-05 mem: 47% pow: 654.322 W 0: INFO 26-04-29 20:35:31.997528 - 5:00:12 - step: 27570 acc: 0 loss: 1.3105 grad: 1.64e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.637 data: 0.0881 lr: 3.34e-05 mem: 47% pow: 642.053 W 0: INFO 26-04-29 20:35:45.572130 - 5:00:26 - step: 27580 acc: 0 loss: 0.9102 grad: 1.67e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.592 data: 0.0824 lr: 3.34e-05 mem: 47% pow: 667.074 W 0: INFO 26-04-29 20:35:59.375824 - 5:00:40 - step: 27590 acc: 0 loss: 1.6275 grad: 1.46e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5966 data: 0.1052 lr: 3.33e-05 mem: 47% pow: 657.573 W 0: INFO 26-04-29 20:36:13.013058 - 5:00:53 - step: 27600 acc: 0 loss: 1.3899 grad: 1.48e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6111 data: 0.09 lr: 3.33e-05 mem: 47% pow: 643.31 W 0: INFO 26-04-29 20:36:29.713788 - 5:01:10 - step: 27610 acc: 0 loss: 1.1832 grad: 1.69e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.6287 data: 0.0897 lr: 3.33e-05 mem: 54% pow: 641.353 W 0: INFO 26-04-29 20:36:43.658611 - 5:01:24 - step: 27620 acc: 0 loss: 1.279 grad: 1.56e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5853 data: 0.1017 lr: 3.33e-05 mem: 47% pow: 672.357 W 0: INFO 26-04-29 20:36:58.179102 - 5:01:38 - step: 27630 acc: 0 loss: 1.1072 grad: 2.00e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 0.6125 data: 0.0923 lr: 3.33e-05 mem: 47% pow: 646.683 W 0: INFO 26-04-29 20:37:12.111896 - 5:01:52 - step: 27640 acc: 0 loss: 1.4846 grad: 1.55e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.5951 data: 0.085 lr: 3.33e-05 mem: 47% pow: 659.524 W 0: INFO 26-04-29 20:37:26.169508 - 5:02:06 - step: 27650 acc: 0 loss: 1.3401 grad: 1.72e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.5968 data: 0.0919 lr: 3.33e-05 mem: 47% pow: 658.026 W 0: INFO 26-04-29 20:37:39.876933 - 5:02:20 - step: 27660 acc: 0 loss: 1.2441 grad: 1.82e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.593 data: 0.0885 lr: 3.32e-05 mem: 47% pow: 660.821 W 0: INFO 26-04-29 20:37:53.784249 - 5:02:34 - step: 27670 acc: 0 loss: 1.5736 grad: 1.62e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6114 data: 0.0769 lr: 3.32e-05 mem: 47% pow: 661.639 W 0: INFO 26-04-29 20:38:07.445572 - 5:02:48 - step: 27680 acc: 0 loss: 1.3188 grad: 1.53e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6219 data: 0.0855 lr: 3.32e-05 mem: 47% pow: 649.22 W 0: INFO 26-04-29 20:38:21.196333 - 5:03:01 - step: 27690 acc: 0 loss: 1.5841 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6019 data: 0.0831 lr: 3.32e-05 mem: 47% pow: 660.315 W 0: INFO 26-04-29 20:38:35.205711 - 5:03:16 - step: 27700 acc: 0 loss: 1.5009 grad: 1.48e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.8015 data: 0.082 lr: 3.32e-05 mem: 47% pow: 548.992 W 0: INFO 26-04-29 20:38:51.685738 - 5:03:32 - step: 27710 acc: 0 loss: 1.3812 grad: 1.62e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.614 data: 0.0798 lr: 3.32e-05 mem: 54% pow: 652.663 W 0: INFO 26-04-29 20:39:05.139875 - 5:03:45 - step: 27720 acc: 0 loss: 1.447 grad: 1.58e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6025 data: 0.0783 lr: 3.32e-05 mem: 47% pow: 656.384 W 0: INFO 26-04-29 20:39:19.048581 - 5:03:59 - step: 27730 acc: 0 loss: 1.5735 grad: 1.55e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.613 data: 0.0749 lr: 3.31e-05 mem: 47% pow: 658.86 W 0: INFO 26-04-29 20:39:32.863700 - 5:04:13 - step: 27740 acc: 0 loss: 1.3921 grad: 1.59e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5944 data: 0.0897 lr: 3.31e-05 mem: 47% pow: 664.792 W 0: INFO 26-04-29 20:39:46.775646 - 5:04:27 - step: 27750 acc: 0 loss: 1.382 grad: 1.53e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5936 data: 0.0881 lr: 3.31e-05 mem: 47% pow: 665.971 W 0: INFO 26-04-29 20:40:00.531842 - 5:04:41 - step: 27760 acc: 0 loss: 1.2052 grad: 1.70e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6033 data: 0.0902 lr: 3.31e-05 mem: 47% pow: 648.795 W 0: INFO 26-04-29 20:40:14.429830 - 5:04:55 - step: 27770 acc: 0 loss: 1.3721 grad: 1.66e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.8097 data: 0.0824 lr: 3.31e-05 mem: 47% pow: 543.536 W 0: INFO 26-04-29 20:40:28.355766 - 5:05:09 - step: 27780 acc: 0 loss: 1.4882 grad: 1.51e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5817 data: 0.0827 lr: 3.31e-05 mem: 47% pow: 676.243 W 0: INFO 26-04-29 20:40:42.122144 - 5:05:22 - step: 27790 acc: 0 loss: 1.3514 grad: 1.63e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5953 data: 0.0876 lr: 3.30e-05 mem: 47% pow: 663.624 W 0: INFO 26-04-29 20:40:56.191457 - 5:05:36 - step: 27800 acc: 0 loss: 1.4219 grad: 1.62e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6653 data: 0.0845 lr: 3.30e-05 mem: 47% pow: 624.136 W 0: INFO 26-04-29 20:41:13.157863 - 5:05:53 - step: 27810 acc: 0 loss: 1.1435 grad: 1.72e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 0.5942 data: 0.0902 lr: 3.30e-05 mem: 54% pow: 658.321 W 0: INFO 26-04-29 20:41:26.764672 - 5:06:07 - step: 27820 acc: 0 loss: 1.457 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6172 data: 0.0888 lr: 3.30e-05 mem: 47% pow: 654.539 W 0: INFO 26-04-29 20:41:40.464485 - 5:06:21 - step: 27830 acc: 0 loss: 1.4039 grad: 1.55e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5962 data: 0.0869 lr: 3.30e-05 mem: 47% pow: 666.821 W 0: INFO 26-04-29 20:41:54.363569 - 5:06:35 - step: 27840 acc: 0 loss: 1.4136 grad: 1.65e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6205 data: 0.0898 lr: 3.30e-05 mem: 47% pow: 645.816 W 0: INFO 26-04-29 20:42:08.253300 - 5:06:49 - step: 27850 acc: 0 loss: 1.8276 grad: 1.53e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6563 data: 0.0879 lr: 3.30e-05 mem: 47% pow: 626.495 W 0: INFO 26-04-29 20:42:21.989788 - 5:07:02 - step: 27860 acc: 0 loss: 1.8176 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7029 data: 0.0874 lr: 3.29e-05 mem: 47% pow: 606.652 W 0: INFO 26-04-29 20:42:36.120582 - 5:07:16 - step: 27870 acc: 0 loss: 1.5714 grad: 1.65e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5876 data: 0.1013 lr: 3.29e-05 mem: 47% pow: 663.493 W 0: INFO 26-04-29 20:42:49.825503 - 5:07:30 - step: 27880 acc: 0 loss: 1.1609 grad: 4.29e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6021 data: 0.0838 lr: 3.29e-05 mem: 47% pow: 660.165 W 0: INFO 26-04-29 20:43:03.672443 - 5:07:44 - step: 27890 acc: 0 loss: 1.2726 grad: 1.55e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5989 data: 0.0873 lr: 3.29e-05 mem: 47% pow: 674.616 W 0: INFO 26-04-29 20:43:17.339717 - 5:07:58 - step: 27900 acc: 0 loss: 1.1497 grad: 1.57e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5956 data: 0.0892 lr: 3.29e-05 mem: 47% pow: 665.89 W 0: INFO 26-04-29 20:43:34.102396 - 5:08:14 - step: 27910 acc: 0 loss: 1.3602 grad: 1.54e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.607 data: 0.0859 lr: 3.29e-05 mem: 54% pow: 660.25 W 0: INFO 26-04-29 20:43:47.749887 - 5:08:28 - step: 27920 acc: 0 loss: 1.1713 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6061 data: 0.0693 lr: 3.29e-05 mem: 47% pow: 666.207 W 0: INFO 26-04-29 20:44:01.458893 - 5:08:42 - step: 27930 acc: 0 loss: 1.8779 grad: 1.57e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6636 data: 0.0911 lr: 3.28e-05 mem: 47% pow: 616.522 W 0: INFO 26-04-29 20:44:15.180891 - 5:08:55 - step: 27940 acc: 0 loss: 1.2609 grad: 1.56e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6782 data: 0.11 lr: 3.28e-05 mem: 47% pow: 599.068 W 0: INFO 26-04-29 20:44:28.742040 - 5:09:09 - step: 27950 acc: 0 loss: 1.3241 grad: 1.61e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5932 data: 0.0871 lr: 3.28e-05 mem: 47% pow: 684.635 W 0: INFO 26-04-29 20:44:42.593144 - 5:09:23 - step: 27960 acc: 0 loss: 1.5915 grad: 1.84e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6077 data: 0.0881 lr: 3.28e-05 mem: 47% pow: 658.917 W 0: INFO 26-04-29 20:44:56.290453 - 5:09:37 - step: 27970 acc: 0 loss: 1.1758 grad: 1.58e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5909 data: 0.0843 lr: 3.28e-05 mem: 47% pow: 680.813 W 0: INFO 26-04-29 20:45:10.269594 - 5:09:51 - step: 27980 acc: 0 loss: 1.5004 grad: 1.63e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5914 data: 0.0799 lr: 3.28e-05 mem: 47% pow: 667.788 W 0: INFO 26-04-29 20:45:24.197160 - 5:10:04 - step: 27990 acc: 0 loss: 1.1422 grad: 1.55e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.6181 data: 0.0658 lr: 3.28e-05 mem: 47% pow: 659.966 W 0: INFO 26-04-29 20:45:38.273959 - 5:10:19 - step: 28000 acc: 0 loss: 1.3533 grad: 1.60e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.5956 data: 0.0961 lr: 3.27e-05 mem: 47% pow: 655.632 W 0: INFO 26-04-29 20:45:42.017076 - 5:10:22 - garbage collection 0: INFO 26-04-29 20:45:56.346007 - 5:10:37 - step: 28010 acc: 0 loss: 1.3204 grad: 1.61e-01 flops: 3.13e+14 wps: 3.63e+04 iter: 0.6207 data: 0.0847 lr: 3.27e-05 mem: 54% pow: 655.01 W 0: INFO 26-04-29 20:46:10.300905 - 5:10:51 - step: 28020 acc: 0 loss: 1.5324 grad: 1.71e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6012 data: 0.0993 lr: 3.27e-05 mem: 47% pow: 648.43 W 0: INFO 26-04-29 20:46:24.222537 - 5:11:05 - step: 28030 acc: 0 loss: 1.4772 grad: 1.53e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.598 data: 0.0868 lr: 3.27e-05 mem: 47% pow: 662.459 W 0: INFO 26-04-29 20:46:37.938450 - 5:11:18 - step: 28040 acc: 0 loss: 1.5914 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5946 data: 0.085 lr: 3.27e-05 mem: 47% pow: 669.34 W 0: INFO 26-04-29 20:46:51.781623 - 5:11:32 - step: 28050 acc: 0 loss: 1.1804 grad: 1.56e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.597 data: 0.1004 lr: 3.27e-05 mem: 47% pow: 646.167 W 0: INFO 26-04-29 20:47:05.581779 - 5:11:46 - step: 28060 acc: 0 loss: 1.1446 grad: 1.62e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5803 data: 0.0889 lr: 3.26e-05 mem: 47% pow: 683.203 W 0: INFO 26-04-29 20:47:19.414975 - 5:12:00 - step: 28070 acc: 0 loss: 1.1715 grad: 1.59e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.592 data: 0.0841 lr: 3.26e-05 mem: 47% pow: 661.513 W 0: INFO 26-04-29 20:47:33.118982 - 5:12:13 - step: 28080 acc: 0 loss: 1.5056 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6076 data: 0.0754 lr: 3.26e-05 mem: 47% pow: 666.938 W 0: INFO 26-04-29 20:47:46.861103 - 5:12:27 - step: 28090 acc: 0 loss: 1.1689 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.598 data: 0.0795 lr: 3.26e-05 mem: 47% pow: 668.932 W 0: INFO 26-04-29 20:48:00.726814 - 5:12:41 - step: 28100 acc: 0 loss: 1.4939 grad: 1.57e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.617 data: 0.0854 lr: 3.26e-05 mem: 47% pow: 649.148 W 0: INFO 26-04-29 20:48:17.516980 - 5:12:58 - step: 28110 acc: 0 loss: 1.6613 grad: 1.51e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6681 data: 0.09 lr: 3.26e-05 mem: 54% pow: 618.264 W 0: INFO 26-04-29 20:48:31.346538 - 5:13:12 - step: 28120 acc: 0 loss: 1.0786 grad: 1.59e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6229 data: 0.0895 lr: 3.26e-05 mem: 47% pow: 648.076 W 0: INFO 26-04-29 20:48:45.182798 - 5:13:25 - step: 28130 acc: 0 loss: 0.9727 grad: 1.80e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5993 data: 0.0883 lr: 3.25e-05 mem: 47% pow: 654.086 W 0: INFO 26-04-29 20:48:58.881780 - 5:13:39 - step: 28140 acc: 0 loss: 1.555 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6144 data: 0.1006 lr: 3.25e-05 mem: 47% pow: 647.915 W 0: INFO 26-04-29 20:49:12.526037 - 5:13:53 - step: 28150 acc: 0 loss: 1.2951 grad: 1.56e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6231 data: 0.0871 lr: 3.25e-05 mem: 47% pow: 651.703 W 0: INFO 26-04-29 20:49:26.289140 - 5:14:07 - step: 28160 acc: 0 loss: 1.2099 grad: 1.57e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6088 data: 0.0643 lr: 3.25e-05 mem: 47% pow: 665.982 W 0: INFO 26-04-29 20:49:40.617140 - 5:14:21 - step: 28170 acc: 0 loss: 1.5214 grad: 1.63e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.5822 data: 0.0954 lr: 3.25e-05 mem: 47% pow: 665.287 W 0: INFO 26-04-29 20:49:54.044181 - 5:14:34 - step: 28180 acc: 0 loss: 1.1509 grad: 1.61e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5874 data: 0.0944 lr: 3.25e-05 mem: 47% pow: 661.37 W 0: INFO 26-04-29 20:50:08.176417 - 5:14:48 - step: 28190 acc: 0 loss: 1.2974 grad: 1.58e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6159 data: 0.0795 lr: 3.25e-05 mem: 47% pow: 659.107 W 0: INFO 26-04-29 20:50:21.808506 - 5:15:02 - step: 28200 acc: 0 loss: 1.6968 grad: 1.56e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6381 data: 0.0893 lr: 3.24e-05 mem: 47% pow: 634.927 W 0: INFO 26-04-29 20:50:38.371847 - 5:15:19 - step: 28210 acc: 0 loss: 1.3137 grad: 1.56e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.601 data: 0.0846 lr: 3.24e-05 mem: 54% pow: 675.802 W 0: INFO 26-04-29 20:50:52.301645 - 5:15:33 - step: 28220 acc: 0 loss: 1.5578 grad: 1.64e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.6246 data: 0.0803 lr: 3.24e-05 mem: 47% pow: 653.047 W 0: INFO 26-04-29 20:51:06.192619 - 5:15:46 - step: 28230 acc: 0 loss: 1.2641 grad: 1.67e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6653 data: 0.0886 lr: 3.24e-05 mem: 47% pow: 630.243 W 0: INFO 26-04-29 20:51:20.155195 - 5:16:00 - step: 28240 acc: 0 loss: 1.2643 grad: 1.85e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5963 data: 0.0829 lr: 3.24e-05 mem: 47% pow: 655.805 W 0: INFO 26-04-29 20:51:34.062399 - 5:16:14 - step: 28250 acc: 0 loss: 1.437 grad: 1.78e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.5951 data: 0.0794 lr: 3.24e-05 mem: 47% pow: 667.525 W 0: INFO 26-04-29 20:51:47.874633 - 5:16:28 - step: 28260 acc: 0 loss: 1.1903 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5991 data: 0.0763 lr: 3.24e-05 mem: 47% pow: 668.18 W 0: INFO 26-04-29 20:52:01.664088 - 5:16:42 - step: 28270 acc: 0 loss: 1.042 grad: 1.70e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6476 data: 0.085 lr: 3.23e-05 mem: 47% pow: 639.268 W 0: INFO 26-04-29 20:52:15.341537 - 5:16:56 - step: 28280 acc: 0 loss: 1.7814 grad: 1.51e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6207 data: 0.0905 lr: 3.23e-05 mem: 47% pow: 642.224 W 0: INFO 26-04-29 20:52:29.067875 - 5:17:09 - step: 28290 acc: 0 loss: 1.1274 grad: 1.73e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5774 data: 0.1078 lr: 3.23e-05 mem: 47% pow: 658.087 W 0: INFO 26-04-29 20:52:42.545547 - 5:17:23 - step: 28300 acc: 0 loss: 1.4676 grad: 1.66e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5786 data: 0.1599 lr: 3.23e-05 mem: 47% pow: 626.343 W 0: INFO 26-04-29 20:52:59.225455 - 5:17:40 - step: 28310 acc: 0 loss: 1.2791 grad: 1.57e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.62 data: 0.105 lr: 3.23e-05 mem: 54% pow: 637.617 W 0: INFO 26-04-29 20:53:12.941888 - 5:17:53 - step: 28320 acc: 0 loss: 1.6283 grad: 1.71e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5905 data: 0.0885 lr: 3.23e-05 mem: 47% pow: 659.899 W 0: INFO 26-04-29 20:53:26.691444 - 5:18:07 - step: 28330 acc: 0 loss: 1.8715 grad: 1.90e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5793 data: 0.142 lr: 3.22e-05 mem: 47% pow: 631.332 W 0: INFO 26-04-29 20:53:40.749447 - 5:18:21 - step: 28340 acc: 0 loss: 1.6529 grad: 1.68e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6373 data: 0.0695 lr: 3.22e-05 mem: 47% pow: 652.251 W 0: INFO 26-04-29 20:53:54.397289 - 5:18:35 - step: 28350 acc: 0 loss: 1.3535 grad: 1.69e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6058 data: 0.0833 lr: 3.22e-05 mem: 47% pow: 661.946 W 0: INFO 26-04-29 20:54:08.207286 - 5:18:49 - step: 28360 acc: 0 loss: 1.375 grad: 1.53e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.61 data: 0.0893 lr: 3.22e-05 mem: 47% pow: 651.481 W 0: INFO 26-04-29 20:54:21.968506 - 5:19:02 - step: 28370 acc: 0 loss: 1.2298 grad: 1.80e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6214 data: 0.0948 lr: 3.22e-05 mem: 47% pow: 647.535 W 0: INFO 26-04-29 20:54:35.578079 - 5:19:16 - step: 28380 acc: 0 loss: 1.3918 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5945 data: 0.0927 lr: 3.22e-05 mem: 47% pow: 664.687 W 0: INFO 26-04-29 20:54:49.546898 - 5:19:30 - step: 28390 acc: 0 loss: 1.888 grad: 1.58e-01 flops: 4.05e+14 wps: 4.69e+04 iter: 0.6519 data: 0.0815 lr: 3.22e-05 mem: 47% pow: 629.385 W 0: INFO 26-04-29 20:55:03.396608 - 5:19:44 - step: 28400 acc: 0 loss: 1.4963 grad: 1.74e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6379 data: 0.0552 lr: 3.21e-05 mem: 47% pow: 673.842 W 0: INFO 26-04-29 20:55:20.021275 - 5:20:00 - step: 28410 acc: 0 loss: 1.2754 grad: 1.90e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.5865 data: 0.0909 lr: 3.21e-05 mem: 54% pow: 662.476 W 0: INFO 26-04-29 20:55:33.979256 - 5:20:14 - step: 28420 acc: 0 loss: 1.3684 grad: 1.64e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5808 data: 0.1302 lr: 3.21e-05 mem: 47% pow: 647.693 W 0: INFO 26-04-29 20:55:47.927793 - 5:20:28 - step: 28430 acc: 0 loss: 1.3121 grad: 1.64e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7992 data: 0.0859 lr: 3.21e-05 mem: 47% pow: 557.123 W 0: INFO 26-04-29 20:56:01.877915 - 5:20:42 - step: 28440 acc: 0 loss: 1.4083 grad: 1.52e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7263 data: 0.0877 lr: 3.21e-05 mem: 47% pow: 585.835 W 0: INFO 26-04-29 20:56:15.409908 - 5:20:56 - step: 28450 acc: 0 loss: 1.3594 grad: 1.58e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.5903 data: 0.0918 lr: 3.21e-05 mem: 47% pow: 659.887 W 0: INFO 26-04-29 20:56:29.060744 - 5:21:09 - step: 28460 acc: 0 loss: 1.3121 grad: 1.62e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5991 data: 0.0856 lr: 3.21e-05 mem: 47% pow: 661.773 W 0: INFO 26-04-29 20:56:42.921630 - 5:21:23 - step: 28470 acc: 0 loss: 1.4193 grad: 1.66e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6184 data: 0.0907 lr: 3.20e-05 mem: 47% pow: 653.943 W 0: INFO 26-04-29 20:56:56.631315 - 5:21:37 - step: 28480 acc: 0 loss: 1.2893 grad: 1.68e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6034 data: 0.0826 lr: 3.20e-05 mem: 47% pow: 658.879 W 0: INFO 26-04-29 20:57:10.283843 - 5:21:51 - step: 28490 acc: 0 loss: 1.5753 grad: 1.64e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.611 data: 0.0873 lr: 3.20e-05 mem: 47% pow: 649.27 W 0: INFO 26-04-29 20:57:24.131672 - 5:22:04 - step: 28500 acc: 0 loss: 1.4888 grad: 1.59e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6032 data: 0.0826 lr: 3.20e-05 mem: 47% pow: 664.213 W 0: INFO 26-04-29 20:57:41.324800 - 5:22:22 - step: 28510 acc: 0 loss: 1.6125 grad: 1.78e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6977 data: 0.0823 lr: 3.20e-05 mem: 54% pow: 607.733 W 0: INFO 26-04-29 20:57:55.300853 - 5:22:36 - step: 28520 acc: 0 loss: 1.5621 grad: 1.60e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6059 data: 0.0893 lr: 3.20e-05 mem: 47% pow: 651.484 W 0: INFO 26-04-29 20:58:09.391782 - 5:22:50 - step: 28530 acc: 0 loss: 1.0722 grad: 1.67e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5963 data: 0.0853 lr: 3.19e-05 mem: 47% pow: 667.206 W 0: INFO 26-04-29 20:58:23.060878 - 5:23:03 - step: 28540 acc: 0 loss: 1.6309 grad: 1.62e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6229 data: 0.0615 lr: 3.19e-05 mem: 47% pow: 660.665 W 0: INFO 26-04-29 20:58:36.922015 - 5:23:17 - step: 28550 acc: 0 loss: 1.7089 grad: 1.60e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.599 data: 0.0872 lr: 3.19e-05 mem: 47% pow: 669.21 W 0: INFO 26-04-29 20:58:50.666354 - 5:23:31 - step: 28560 acc: 0 loss: 1.4811 grad: 1.87e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6373 data: 0.0499 lr: 3.19e-05 mem: 47% pow: 676.054 W 0: INFO 26-04-29 20:59:04.492588 - 5:23:45 - step: 28570 acc: 0 loss: 1.3575 grad: 1.57e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6404 data: 0.0862 lr: 3.19e-05 mem: 47% pow: 637.481 W 0: INFO 26-04-29 20:59:18.418134 - 5:23:59 - step: 28580 acc: 0 loss: 1.5138 grad: 1.84e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6013 data: 0.0868 lr: 3.19e-05 mem: 47% pow: 656.166 W 0: INFO 26-04-29 20:59:32.693940 - 5:24:13 - step: 28590 acc: 0 loss: 1.344 grad: 1.72e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.5817 data: 0.0922 lr: 3.19e-05 mem: 47% pow: 664.405 W 0: INFO 26-04-29 20:59:46.486116 - 5:24:27 - step: 28600 acc: 0 loss: 1.4826 grad: 1.59e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6782 data: 0.0752 lr: 3.18e-05 mem: 47% pow: 620.604 W 0: INFO 26-04-29 21:00:03.444068 - 5:24:44 - step: 28610 acc: 0 loss: 1.7105 grad: 1.60e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.6537 data: 0.0833 lr: 3.18e-05 mem: 54% pow: 626.29 W 0: INFO 26-04-29 21:00:17.254508 - 5:24:58 - step: 28620 acc: 0 loss: 1.8796 grad: 1.59e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.7127 data: 0.0882 lr: 3.18e-05 mem: 47% pow: 590.881 W 0: INFO 26-04-29 21:00:31.399941 - 5:25:12 - step: 28630 acc: 0 loss: 1.2437 grad: 1.64e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6545 data: 0.0905 lr: 3.18e-05 mem: 47% pow: 621.227 W 0: INFO 26-04-29 21:00:45.150477 - 5:25:25 - step: 28640 acc: 0 loss: 1.4602 grad: 1.60e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6046 data: 0.0943 lr: 3.18e-05 mem: 47% pow: 650.106 W 0: INFO 26-04-29 21:00:59.118578 - 5:25:39 - step: 28650 acc: 0 loss: 1.2351 grad: 1.71e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5793 data: 0.1071 lr: 3.18e-05 mem: 47% pow: 674.202 W 0: INFO 26-04-29 21:01:12.918719 - 5:25:53 - step: 28660 acc: 0 loss: 1.5225 grad: 1.69e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.605 data: 0.0859 lr: 3.18e-05 mem: 47% pow: 665.415 W 0: INFO 26-04-29 21:01:26.522417 - 5:26:07 - step: 28670 acc: 0 loss: 1.2676 grad: 1.74e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5964 data: 0.0881 lr: 3.17e-05 mem: 47% pow: 655.171 W 0: INFO 26-04-29 21:01:40.586782 - 5:26:21 - step: 28680 acc: 0 loss: 1.5885 grad: 1.64e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.702 data: 0.0889 lr: 3.17e-05 mem: 47% pow: 600.886 W 0: INFO 26-04-29 21:01:54.465665 - 5:26:35 - step: 28690 acc: 0 loss: 1.0392 grad: 1.57e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6213 data: 0.0887 lr: 3.17e-05 mem: 47% pow: 647.785 W 0: INFO 26-04-29 21:02:08.037608 - 5:26:48 - step: 28700 acc: 0 loss: 1.5609 grad: 1.59e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5959 data: 0.0885 lr: 3.17e-05 mem: 47% pow: 672.464 W 0: INFO 26-04-29 21:02:24.837211 - 5:27:05 - step: 28710 acc: 0 loss: 1.5267 grad: 1.60e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6767 data: 0.0873 lr: 3.17e-05 mem: 54% pow: 613.779 W 0: INFO 26-04-29 21:02:38.490663 - 5:27:19 - step: 28720 acc: 0 loss: 1.4874 grad: 1.56e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6074 data: 0.0862 lr: 3.17e-05 mem: 47% pow: 658.744 W 0: INFO 26-04-29 21:02:52.349597 - 5:27:33 - step: 28730 acc: 0 loss: 1.2401 grad: 1.67e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6752 data: 0.0199 lr: 3.17e-05 mem: 47% pow: 656.462 W 0: INFO 26-04-29 21:03:06.348374 - 5:27:47 - step: 28740 acc: 0 loss: 1.5441 grad: 1.49e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.5848 data: 0.0896 lr: 3.16e-05 mem: 47% pow: 667.725 W 0: INFO 26-04-29 21:03:20.035010 - 5:28:00 - step: 28750 acc: 0 loss: 1.002 grad: 1.62e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6174 data: 0.0826 lr: 3.16e-05 mem: 47% pow: 647.228 W 0: INFO 26-04-29 21:03:33.555624 - 5:28:14 - step: 28760 acc: 0 loss: 1.3115 grad: 1.52e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5955 data: 0.0821 lr: 3.16e-05 mem: 47% pow: 648.49 W 0: INFO 26-04-29 21:03:47.575070 - 5:28:28 - step: 28770 acc: 0 loss: 0.9996 grad: 1.89e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6089 data: 0.0951 lr: 3.16e-05 mem: 47% pow: 645.72 W 0: INFO 26-04-29 21:04:01.331072 - 5:28:42 - step: 28780 acc: 0 loss: 1.4273 grad: 1.59e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6548 data: 0.069 lr: 3.16e-05 mem: 47% pow: 643.331 W 0: INFO 26-04-29 21:04:15.307974 - 5:28:56 - step: 28790 acc: 0 loss: 1.3834 grad: 1.53e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7214 data: 0.0952 lr: 3.16e-05 mem: 47% pow: 586.174 W 0: INFO 26-04-29 21:04:28.973547 - 5:29:09 - step: 28800 acc: 0 loss: 1.6431 grad: 1.64e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6313 data: 0.0889 lr: 3.15e-05 mem: 47% pow: 636.026 W 0: INFO 26-04-29 21:04:45.684445 - 5:29:26 - step: 28810 acc: 0 loss: 1.2193 grad: 1.50e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.6095 data: 0.0979 lr: 3.15e-05 mem: 54% pow: 652.967 W 0: INFO 26-04-29 21:04:59.298561 - 5:29:40 - step: 28820 acc: 0 loss: 1.0553 grad: 1.54e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6106 data: 0.0819 lr: 3.15e-05 mem: 47% pow: 659.729 W 0: INFO 26-04-29 21:05:13.348479 - 5:29:54 - step: 28830 acc: 0 loss: 1.139 grad: 1.57e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.7212 data: 0.0879 lr: 3.15e-05 mem: 47% pow: 589.39 W 0: INFO 26-04-29 21:05:26.921788 - 5:30:07 - step: 28840 acc: 0 loss: 0.961 grad: 1.55e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5927 data: 0.0875 lr: 3.15e-05 mem: 47% pow: 677.222 W 0: INFO 26-04-29 21:05:40.999575 - 5:30:21 - step: 28850 acc: 0 loss: 1.0956 grad: 1.49e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6023 data: 0.0855 lr: 3.15e-05 mem: 47% pow: 659.853 W 0: INFO 26-04-29 21:05:55.151315 - 5:30:35 - step: 28860 acc: 0 loss: 1.2911 grad: 1.52e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5842 data: 0.0951 lr: 3.15e-05 mem: 47% pow: 659.417 W 0: INFO 26-04-29 21:06:08.769733 - 5:30:49 - step: 28870 acc: 0 loss: 1.8171 grad: 1.59e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5844 data: 0.0909 lr: 3.14e-05 mem: 47% pow: 663.623 W 0: INFO 26-04-29 21:06:22.315043 - 5:31:03 - step: 28880 acc: 0 loss: 1.11 grad: 1.57e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5963 data: 0.0872 lr: 3.14e-05 mem: 47% pow: 655.255 W 0: INFO 26-04-29 21:06:35.957862 - 5:31:16 - step: 28890 acc: 0 loss: 1.516 grad: 1.63e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.611 data: 0.0711 lr: 3.14e-05 mem: 47% pow: 657.056 W 0: INFO 26-04-29 21:06:49.989557 - 5:31:30 - step: 28900 acc: 0 loss: 1.4837 grad: 1.51e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6042 data: 0.0832 lr: 3.14e-05 mem: 47% pow: 660.241 W 0: INFO 26-04-29 21:07:06.572901 - 5:31:47 - step: 28910 acc: 0 loss: 1.5651 grad: 1.65e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6169 data: 0.0728 lr: 3.14e-05 mem: 54% pow: 657.349 W 0: INFO 26-04-29 21:07:20.400657 - 5:32:01 - step: 28920 acc: 0 loss: 1.467 grad: 1.94e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6354 data: 0.0866 lr: 3.14e-05 mem: 47% pow: 639.652 W 0: INFO 26-04-29 21:07:34.323679 - 5:32:15 - step: 28930 acc: 0 loss: 1.5831 grad: 1.56e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6199 data: 0.0903 lr: 3.14e-05 mem: 47% pow: 649.143 W 0: INFO 26-04-29 21:07:49.779256 - 5:32:30 - step: 28940 acc: 0 loss: 1.1856 grad: 1.60e-01 flops: 3.65e+14 wps: 4.24e+04 iter: 0.6167 data: 0.089 lr: 3.13e-05 mem: 47% pow: 647.457 W 0: INFO 26-04-29 21:08:03.460864 - 5:32:44 - step: 28950 acc: 0 loss: 1.4351 grad: 1.63e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6775 data: 0.0881 lr: 3.13e-05 mem: 47% pow: 623.913 W 0: INFO 26-04-29 21:08:17.520817 - 5:32:58 - step: 28960 acc: 0 loss: 1.0799 grad: 1.52e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6004 data: 0.0824 lr: 3.13e-05 mem: 47% pow: 664.21 W 0: INFO 26-04-29 21:08:31.179336 - 5:33:11 - step: 28970 acc: 0 loss: 1.5987 grad: 1.55e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6156 data: 0.0892 lr: 3.13e-05 mem: 47% pow: 650.104 W 0: INFO 26-04-29 21:08:46.286555 - 5:33:27 - step: 28980 acc: 0 loss: 1.386 grad: 1.54e-01 flops: 3.74e+14 wps: 4.34e+04 iter: 0.598 data: 0.0837 lr: 3.13e-05 mem: 47% pow: 652.919 W 0: INFO 26-04-29 21:08:59.969579 - 5:33:40 - step: 28990 acc: 0 loss: 1.2216 grad: 1.60e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5774 data: 0.0908 lr: 3.13e-05 mem: 47% pow: 665.288 W 0: INFO 26-04-29 21:09:13.959444 - 5:33:54 - step: 29000 acc: 0 loss: 1.7057 grad: 1.56e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6195 data: 0.0841 lr: 3.12e-05 mem: 47% pow: 653.075 W 0: INFO 26-04-29 21:09:17.660592 - 5:33:58 - garbage collection 0: INFO 26-04-29 21:09:32.070244 - 5:34:12 - step: 29010 acc: 0 loss: 1.4796 grad: 1.64e-01 flops: 3.12e+14 wps: 3.62e+04 iter: 0.5954 data: 0.0804 lr: 3.12e-05 mem: 54% pow: 658.307 W 0: INFO 26-04-29 21:09:45.800462 - 5:34:26 - step: 29020 acc: 0 loss: 1.5631 grad: 1.61e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6436 data: 0.0772 lr: 3.12e-05 mem: 47% pow: 638.571 W 0: INFO 26-04-29 21:09:59.944884 - 5:34:40 - step: 29030 acc: 0 loss: 1.3013 grad: 1.73e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.7321 data: 0.0928 lr: 3.12e-05 mem: 47% pow: 590.939 W 0: INFO 26-04-29 21:10:13.697465 - 5:34:54 - step: 29040 acc: 0 loss: 1.2166 grad: 1.61e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5909 data: 0.0911 lr: 3.12e-05 mem: 47% pow: 656.641 W 0: INFO 26-04-29 21:10:27.357176 - 5:35:08 - step: 29050 acc: 0 loss: 1.9345 grad: 1.84e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5873 data: 0.109 lr: 3.12e-05 mem: 47% pow: 650.561 W 0: INFO 26-04-29 21:10:41.061939 - 5:35:21 - step: 29060 acc: 0 loss: 1.5919 grad: 1.63e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6387 data: 0.066 lr: 3.12e-05 mem: 47% pow: 659.55 W 0: INFO 26-04-29 21:10:54.993187 - 5:35:35 - step: 29070 acc: 0 loss: 1.5828 grad: 1.59e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6261 data: 0.0858 lr: 3.11e-05 mem: 47% pow: 648.334 W 0: INFO 26-04-29 21:11:08.617290 - 5:35:49 - step: 29080 acc: 0 loss: 1.5953 grad: 1.75e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6082 data: 0.0859 lr: 3.11e-05 mem: 47% pow: 655.385 W 0: INFO 26-04-29 21:11:22.520756 - 5:36:03 - step: 29090 acc: 0 loss: 1.2698 grad: 1.53e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6128 data: 0.081 lr: 3.11e-05 mem: 47% pow: 651.695 W 0: INFO 26-04-29 21:11:36.454750 - 5:36:17 - step: 29100 acc: 0 loss: 1.2733 grad: 1.59e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6239 data: 0.0713 lr: 3.11e-05 mem: 47% pow: 651.648 W 0: INFO 26-04-29 21:11:53.123682 - 5:36:33 - step: 29110 acc: 0 loss: 1.396 grad: 1.54e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6116 data: 0.0753 lr: 3.11e-05 mem: 54% pow: 660.682 W 0: INFO 26-04-29 21:12:06.633288 - 5:36:47 - step: 29120 acc: 0 loss: 1.5023 grad: 1.49e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6078 data: 0.0886 lr: 3.11e-05 mem: 47% pow: 642.433 W 0: INFO 26-04-29 21:12:20.328150 - 5:37:01 - step: 29130 acc: 0 loss: 1.6151 grad: 1.48e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6446 data: 0.0881 lr: 3.11e-05 mem: 47% pow: 634.592 W 0: INFO 26-04-29 21:12:34.084208 - 5:37:14 - step: 29140 acc: 0 loss: 1.5154 grad: 1.62e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6148 data: 0.0845 lr: 3.10e-05 mem: 47% pow: 662.044 W 0: INFO 26-04-29 21:12:47.675127 - 5:37:28 - step: 29150 acc: 0 loss: 1.5232 grad: 1.69e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6178 data: 0.0604 lr: 3.10e-05 mem: 47% pow: 657.67 W 0: INFO 26-04-29 21:13:01.696792 - 5:37:42 - step: 29160 acc: 0 loss: 1.3186 grad: 1.67e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6186 data: 0.0711 lr: 3.10e-05 mem: 47% pow: 660.551 W 0: INFO 26-04-29 21:13:15.934413 - 5:37:56 - step: 29170 acc: 0 loss: 1.3651 grad: 1.58e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6079 data: 0.0819 lr: 3.10e-05 mem: 47% pow: 663.28 W 0: INFO 26-04-29 21:13:29.578555 - 5:38:10 - step: 29180 acc: 0 loss: 1.3439 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5837 data: 0.0874 lr: 3.10e-05 mem: 47% pow: 669.772 W 0: INFO 26-04-29 21:13:43.782665 - 5:38:24 - step: 29190 acc: 0 loss: 1.313 grad: 1.56e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6709 data: 0.0871 lr: 3.10e-05 mem: 47% pow: 606.453 W 0: INFO 26-04-29 21:13:57.691430 - 5:38:38 - step: 29200 acc: 0 loss: 1.615 grad: 1.51e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7309 data: 0.0842 lr: 3.10e-05 mem: 47% pow: 583.864 W 0: INFO 26-04-29 21:14:14.503292 - 5:38:55 - step: 29210 acc: 0 loss: 1.2287 grad: 1.54e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6656 data: 0.0762 lr: 3.09e-05 mem: 54% pow: 624.762 W 0: INFO 26-04-29 21:14:28.094449 - 5:39:08 - step: 29220 acc: 0 loss: 1.0143 grad: 1.60e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5974 data: 0.0794 lr: 3.09e-05 mem: 47% pow: 661.351 W 0: INFO 26-04-29 21:14:41.626211 - 5:39:22 - step: 29230 acc: 0 loss: 1.6214 grad: 1.91e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5867 data: 0.0898 lr: 3.09e-05 mem: 47% pow: 666.984 W 0: INFO 26-04-29 21:14:55.681293 - 5:39:36 - step: 29240 acc: 0 loss: 1.7632 grad: 1.56e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6981 data: 0.0833 lr: 3.09e-05 mem: 47% pow: 607.186 W 0: INFO 26-04-29 21:15:09.278903 - 5:39:50 - step: 29250 acc: 0 loss: 1.0717 grad: 1.76e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5878 data: 0.0872 lr: 3.09e-05 mem: 47% pow: 663.56 W 0: INFO 26-04-29 21:15:23.371537 - 5:40:04 - step: 29260 acc: 0 loss: 1.2071 grad: 1.55e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5785 data: 0.1092 lr: 3.09e-05 mem: 47% pow: 659.371 W 0: INFO 26-04-29 21:15:37.083992 - 5:40:17 - step: 29270 acc: 0 loss: 1.1444 grad: 1.57e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6733 data: 0.0855 lr: 3.08e-05 mem: 47% pow: 615.986 W 0: INFO 26-04-29 21:15:50.650070 - 5:40:31 - step: 29280 acc: 0 loss: 1.847 grad: 1.52e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5923 data: 0.0926 lr: 3.08e-05 mem: 47% pow: 660.115 W 0: INFO 26-04-29 21:16:04.442180 - 5:40:45 - step: 29290 acc: 0 loss: 1.6159 grad: 1.59e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5823 data: 0.1021 lr: 3.08e-05 mem: 47% pow: 663.887 W 0: INFO 26-04-29 21:16:18.362749 - 5:40:59 - step: 29300 acc: 0 loss: 1.3161 grad: 1.81e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6113 data: 0.0904 lr: 3.08e-05 mem: 47% pow: 661.154 W 0: INFO 26-04-29 21:16:34.960798 - 5:41:15 - step: 29310 acc: 0 loss: 1.7084 grad: 1.74e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6669 data: 0.0959 lr: 3.08e-05 mem: 54% pow: 609.834 W 0: INFO 26-04-29 21:16:48.571722 - 5:41:29 - step: 29320 acc: 0 loss: 1.325 grad: 1.58e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6375 data: 0.0893 lr: 3.08e-05 mem: 47% pow: 634.819 W 0: INFO 26-04-29 21:17:02.282175 - 5:41:43 - step: 29330 acc: 0 loss: 1.1594 grad: 1.74e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6017 data: 0.0758 lr: 3.08e-05 mem: 47% pow: 661.202 W 0: INFO 26-04-29 21:17:16.061418 - 5:41:56 - step: 29340 acc: 0 loss: 1.4043 grad: 1.55e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6139 data: 0.0877 lr: 3.07e-05 mem: 47% pow: 651.374 W 0: INFO 26-04-29 21:17:29.654774 - 5:42:10 - step: 29350 acc: 0 loss: 1.833 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5848 data: 0.0954 lr: 3.07e-05 mem: 47% pow: 684.798 W 0: INFO 26-04-29 21:17:43.154521 - 5:42:23 - step: 29360 acc: 0 loss: 1.2529 grad: 1.60e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5947 data: 0.0923 lr: 3.07e-05 mem: 47% pow: 660.145 W 0: INFO 26-04-29 21:17:56.827874 - 5:42:37 - step: 29370 acc: 0 loss: 1.9506 grad: 1.58e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5792 data: 0.1077 lr: 3.07e-05 mem: 47% pow: 654.88 W 0: INFO 26-04-29 21:18:10.503567 - 5:42:51 - step: 29380 acc: 0 loss: 1.1994 grad: 1.60e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5895 data: 0.0953 lr: 3.07e-05 mem: 47% pow: 661.899 W 0: INFO 26-04-29 21:18:24.213715 - 5:43:05 - step: 29390 acc: 0 loss: 1.2354 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6315 data: 0.0625 lr: 3.07e-05 mem: 47% pow: 657.69 W 0: INFO 26-04-29 21:18:37.769150 - 5:43:18 - step: 29400 acc: 0 loss: 1.4365 grad: 1.58e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6451 data: 0.0865 lr: 3.07e-05 mem: 47% pow: 632.271 W 0: INFO 26-04-29 21:18:54.652510 - 5:43:35 - step: 29410 acc: 0 loss: 1.5697 grad: 1.55e-01 flops: 3.35e+14 wps: 3.88e+04 iter: 0.6512 data: 0.0763 lr: 3.06e-05 mem: 54% pow: 639.965 W 0: INFO 26-04-29 21:19:08.283282 - 5:43:49 - step: 29420 acc: 0 loss: 1.4554 grad: 1.59e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5806 data: 0.0943 lr: 3.06e-05 mem: 47% pow: 664.48 W 0: INFO 26-04-29 21:19:22.117309 - 5:44:02 - step: 29430 acc: 0 loss: 1.4014 grad: 1.57e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5997 data: 0.0952 lr: 3.06e-05 mem: 47% pow: 652.075 W 0: INFO 26-04-29 21:19:35.658421 - 5:44:16 - step: 29440 acc: 0 loss: 1.1941 grad: 1.56e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5806 data: 0.0938 lr: 3.06e-05 mem: 47% pow: 667.597 W 0: INFO 26-04-29 21:19:49.314193 - 5:44:30 - step: 29450 acc: 0 loss: 1.8246 grad: 1.70e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6112 data: 0.0928 lr: 3.06e-05 mem: 47% pow: 649.919 W 0: INFO 26-04-29 21:20:03.103647 - 5:44:43 - step: 29460 acc: 0 loss: 1.3682 grad: 1.58e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.8179 data: 0.0758 lr: 3.06e-05 mem: 47% pow: 549.026 W 0: INFO 26-04-29 21:20:16.789285 - 5:44:57 - step: 29470 acc: 0 loss: 1.743 grad: 2.07e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5787 data: 0.0893 lr: 3.06e-05 mem: 47% pow: 667.48 W 0: INFO 26-04-29 21:20:30.359176 - 5:45:11 - step: 29480 acc: 0 loss: 1.3595 grad: 1.62e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5879 data: 0.0908 lr: 3.05e-05 mem: 47% pow: 662.749 W 0: INFO 26-04-29 21:20:43.874011 - 5:45:24 - step: 29490 acc: 0 loss: 1.6833 grad: 1.63e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5873 data: 0.089 lr: 3.05e-05 mem: 47% pow: 665.104 W 0: INFO 26-04-29 21:20:57.535036 - 5:45:38 - step: 29500 acc: 0 loss: 1.6548 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6065 data: 0.0769 lr: 3.05e-05 mem: 47% pow: 662.619 W 0: INFO 26-04-29 21:21:14.072177 - 5:45:54 - step: 29510 acc: 0 loss: 0.9756 grad: 1.59e-01 flops: 3.42e+14 wps: 3.96e+04 iter: 0.6305 data: 0.0952 lr: 3.05e-05 mem: 54% pow: 650.688 W 0: INFO 26-04-29 21:21:27.844404 - 5:46:08 - step: 29520 acc: 0 loss: 1.4793 grad: 1.55e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6053 data: 0.0909 lr: 3.05e-05 mem: 47% pow: 651.733 W 0: INFO 26-04-29 21:21:41.543056 - 5:46:22 - step: 29530 acc: 0 loss: 1.0047 grad: 1.64e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6427 data: 0.085 lr: 3.05e-05 mem: 47% pow: 634.045 W 0: INFO 26-04-29 21:21:55.511274 - 5:46:36 - step: 29540 acc: 0 loss: 1.1262 grad: 1.57e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5928 data: 0.0921 lr: 3.04e-05 mem: 47% pow: 665.139 W 0: INFO 26-04-29 21:22:09.380054 - 5:46:50 - step: 29550 acc: 0 loss: 1.0864 grad: 1.57e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.7446 data: 0.0928 lr: 3.04e-05 mem: 47% pow: 574.203 W 0: INFO 26-04-29 21:22:23.026419 - 5:47:03 - step: 29560 acc: 0 loss: 1.3565 grad: 1.57e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5981 data: 0.0858 lr: 3.04e-05 mem: 47% pow: 661.141 W 0: INFO 26-04-29 21:22:36.520849 - 5:47:17 - step: 29570 acc: 0 loss: 1.3959 grad: 1.52e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5857 data: 0.0937 lr: 3.04e-05 mem: 47% pow: 667.609 W 0: INFO 26-04-29 21:22:50.141924 - 5:47:30 - step: 29580 acc: 0 loss: 1.2814 grad: 1.60e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6052 data: 0.0891 lr: 3.04e-05 mem: 47% pow: 652.265 W 0: INFO 26-04-29 21:23:03.630871 - 5:47:44 - step: 29590 acc: 0 loss: 1.3876 grad: 1.55e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5942 data: 0.0895 lr: 3.04e-05 mem: 47% pow: 662.855 W 0: INFO 26-04-29 21:23:17.148402 - 5:47:57 - step: 29600 acc: 0 loss: 1.6314 grad: 1.73e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6175 data: 0.0782 lr: 3.04e-05 mem: 47% pow: 645.879 W 0: INFO 26-04-29 21:23:33.597514 - 5:48:14 - step: 29610 acc: 0 loss: 1.4025 grad: 1.61e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.6602 data: 0.0735 lr: 3.03e-05 mem: 54% pow: 628.186 W 0: INFO 26-04-29 21:23:47.119366 - 5:48:27 - step: 29620 acc: 0 loss: 1.8995 grad: 1.80e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5974 data: 0.0938 lr: 3.03e-05 mem: 47% pow: 659.134 W 0: INFO 26-04-29 21:24:00.990283 - 5:48:41 - step: 29630 acc: 0 loss: 1.266 grad: 1.81e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5784 data: 0.0946 lr: 3.03e-05 mem: 47% pow: 667.452 W 0: INFO 26-04-29 21:24:14.547528 - 5:48:55 - step: 29640 acc: 0 loss: 1.7637 grad: 1.64e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6018 data: 0.0824 lr: 3.03e-05 mem: 47% pow: 662.319 W 0: INFO 26-04-29 21:24:28.178733 - 5:49:08 - step: 29650 acc: 0 loss: 1.5683 grad: 1.63e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5861 data: 0.0905 lr: 3.03e-05 mem: 47% pow: 659.74 W 0: INFO 26-04-29 21:24:41.646515 - 5:49:22 - step: 29660 acc: 0 loss: 1.3724 grad: 1.58e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5876 data: 0.0962 lr: 3.03e-05 mem: 47% pow: 663.764 W 0: INFO 26-04-29 21:24:55.175487 - 5:49:35 - step: 29670 acc: 0 loss: 1.5824 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6105 data: 0.0938 lr: 3.03e-05 mem: 47% pow: 648.341 W 0: INFO 26-04-29 21:25:08.843112 - 5:49:49 - step: 29680 acc: 0 loss: 1.2848 grad: 1.51e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5915 data: 0.0903 lr: 3.02e-05 mem: 47% pow: 676.087 W 0: INFO 26-04-29 21:25:22.525563 - 5:50:03 - step: 29690 acc: 0 loss: 1.2739 grad: 1.68e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.7347 data: 0.0867 lr: 3.02e-05 mem: 47% pow: 583.783 W 0: INFO 26-04-29 21:25:36.401660 - 5:50:17 - step: 29700 acc: 0 loss: 1.7299 grad: 1.83e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6304 data: 0.0843 lr: 3.02e-05 mem: 47% pow: 639.859 W 0: INFO 26-04-29 21:25:52.950227 - 5:50:33 - step: 29710 acc: 0 loss: 1.1491 grad: 1.70e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.5953 data: 0.0879 lr: 3.02e-05 mem: 54% pow: 671.997 W 0: INFO 26-04-29 21:26:06.491961 - 5:50:47 - step: 29720 acc: 0 loss: 1.2052 grad: 1.55e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5867 data: 0.0906 lr: 3.02e-05 mem: 47% pow: 677.996 W 0: INFO 26-04-29 21:26:19.923987 - 5:51:00 - step: 29730 acc: 0 loss: 1.3437 grad: 1.54e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5805 data: 0.1034 lr: 3.02e-05 mem: 47% pow: 662.477 W 0: INFO 26-04-29 21:26:33.356395 - 5:51:14 - step: 29740 acc: 0 loss: 1.1368 grad: 1.65e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.6098 data: 0.0917 lr: 3.01e-05 mem: 47% pow: 647.901 W 0: INFO 26-04-29 21:26:46.983607 - 5:51:27 - step: 29750 acc: 0 loss: 1.7005 grad: 1.71e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.644 data: 0.0771 lr: 3.01e-05 mem: 47% pow: 637.062 W 0: INFO 26-04-29 21:27:00.476384 - 5:51:41 - step: 29760 acc: 0 loss: 1.5842 grad: 1.64e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5913 data: 0.0841 lr: 3.01e-05 mem: 47% pow: 672.076 W 0: INFO 26-04-29 21:27:13.944388 - 5:51:54 - step: 29770 acc: 0 loss: 1.1555 grad: 1.74e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6172 data: 0.0794 lr: 3.01e-05 mem: 47% pow: 659.379 W 0: INFO 26-04-29 21:27:27.550400 - 5:52:08 - step: 29780 acc: 0 loss: 1.1397 grad: 1.71e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.7845 data: 0.0553 lr: 3.01e-05 mem: 47% pow: 593.232 W 0: INFO 26-04-29 21:27:41.049297 - 5:52:21 - step: 29790 acc: 0 loss: 1.3058 grad: 1.59e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6017 data: 0.0874 lr: 3.01e-05 mem: 47% pow: 672.641 W 0: INFO 26-04-29 21:27:54.662969 - 5:52:35 - step: 29800 acc: 0 loss: 1.1572 grad: 1.51e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.589 data: 0.0915 lr: 3.01e-05 mem: 47% pow: 657.575 W 0: INFO 26-04-29 21:28:11.122968 - 5:52:51 - step: 29810 acc: 0 loss: 1.4653 grad: 1.53e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.593 data: 0.0835 lr: 3.00e-05 mem: 54% pow: 654.532 W 0: INFO 26-04-29 21:28:24.705645 - 5:53:05 - step: 29820 acc: 0 loss: 1.4174 grad: 1.71e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5926 data: 0.0961 lr: 3.00e-05 mem: 47% pow: 660.302 W 0: INFO 26-04-29 21:28:38.279716 - 5:53:19 - step: 29830 acc: 0 loss: 1.3374 grad: 1.53e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5946 data: 0.0873 lr: 3.00e-05 mem: 47% pow: 662.586 W 0: INFO 26-04-29 21:28:52.059161 - 5:53:32 - step: 29840 acc: 0 loss: 0.9929 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.591 data: 0.0906 lr: 3.00e-05 mem: 47% pow: 659.502 W 0: INFO 26-04-29 21:29:05.728600 - 5:53:46 - step: 29850 acc: 0 loss: 1.2644 grad: 1.58e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5967 data: 0.0934 lr: 3.00e-05 mem: 47% pow: 656.075 W 0: INFO 26-04-29 21:29:19.301873 - 5:54:00 - step: 29860 acc: 0 loss: 1.4429 grad: 1.58e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6055 data: 0.0957 lr: 3.00e-05 mem: 47% pow: 648.762 W 0: INFO 26-04-29 21:29:33.014346 - 5:54:13 - step: 29870 acc: 0 loss: 1.0086 grad: 1.67e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5901 data: 0.0885 lr: 3.00e-05 mem: 47% pow: 662.598 W 0: INFO 26-04-29 21:29:46.938964 - 5:54:27 - step: 29880 acc: 0 loss: 1.2479 grad: 1.59e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6002 data: 0.0937 lr: 2.99e-05 mem: 47% pow: 663.081 W 0: INFO 26-04-29 21:30:00.493238 - 5:54:41 - step: 29890 acc: 0 loss: 1.5719 grad: 1.47e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.608 data: 0.0654 lr: 2.99e-05 mem: 47% pow: 669.828 W 0: INFO 26-04-29 21:30:14.212894 - 5:54:55 - step: 29900 acc: 0 loss: 1.236 grad: 1.64e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6162 data: 0.0913 lr: 2.99e-05 mem: 47% pow: 649.263 W 0: INFO 26-04-29 21:30:30.668193 - 5:55:11 - step: 29910 acc: 0 loss: 1.5866 grad: 1.60e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5886 data: 0.0826 lr: 2.99e-05 mem: 54% pow: 669.637 W 0: INFO 26-04-29 21:30:44.057108 - 5:55:24 - step: 29920 acc: 0 loss: 1.4098 grad: 1.64e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5887 data: 0.0927 lr: 2.99e-05 mem: 47% pow: 665.884 W 0: INFO 26-04-29 21:30:57.734730 - 5:55:38 - step: 29930 acc: 0 loss: 1.0565 grad: 1.58e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5937 data: 0.0812 lr: 2.99e-05 mem: 47% pow: 671.359 W 0: INFO 26-04-29 21:31:11.356333 - 5:55:52 - step: 29940 acc: 0 loss: 1.158 grad: 1.72e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6208 data: 0.0802 lr: 2.99e-05 mem: 47% pow: 647.098 W 0: INFO 26-04-29 21:31:25.050569 - 5:56:05 - step: 29950 acc: 0 loss: 1.5909 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6839 data: 0.0984 lr: 2.98e-05 mem: 47% pow: 601.026 W 0: INFO 26-04-29 21:31:38.459109 - 5:56:19 - step: 29960 acc: 0 loss: 1.0362 grad: 1.61e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5907 data: 0.0907 lr: 2.98e-05 mem: 47% pow: 665.455 W 0: INFO 26-04-29 21:31:52.139956 - 5:56:32 - step: 29970 acc: 0 loss: 1.3131 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5866 data: 0.0931 lr: 2.98e-05 mem: 47% pow: 663.166 W 0: INFO 26-04-29 21:32:05.718994 - 5:56:46 - step: 29980 acc: 0 loss: 1.1737 grad: 1.67e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6094 data: 0.091 lr: 2.98e-05 mem: 47% pow: 649.223 W 0: INFO 26-04-29 21:32:19.311837 - 5:57:00 - step: 29990 acc: 0 loss: 1.1113 grad: 1.59e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5933 data: 0.0908 lr: 2.98e-05 mem: 47% pow: 679.001 W 0: INFO 26-04-29 21:32:32.875741 - 5:57:13 - step: 30000 acc: 0 loss: 1.128 grad: 1.58e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6205 data: 0.0921 lr: 2.98e-05 mem: 47% pow: 647.634 W 0: INFO 26-04-29 21:32:32.884054 - 5:57:13 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000030000 0: INFO 26-04-29 21:32:32.884468 - 5:57:13 - Saving... 0: INFO 26-04-29 21:32:38.191310 - 5:57:18 - State dict saved! 0: INFO 26-04-29 21:32:38.282271 - 5:57:19 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000030000/train_state_00000.json 0: INFO 26-04-29 21:32:38.286778 - 5:57:19 - Train state saved ! 0: INFO 26-04-29 21:32:38.287168 - 5:57:19 - Cleaning up checkpoints... 0: INFO 26-04-29 21:32:38.287671 - 5:57:19 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000025000'), PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000030000')] 0: INFO 26-04-29 21:32:38.287867 - 5:57:19 - Eval folders: [] 0: INFO 26-04-29 21:32:38.288025 - 5:57:19 - Other folders: [] 0: INFO 26-04-29 21:32:38.288203 - 5:57:19 - Removing folders: {PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000025000')} 0: INFO 26-04-29 21:32:42.394369 - 5:57:23 - garbage collection 0: INFO 26-04-29 21:32:56.699334 - 5:57:37 - step: 30010 acc: 0 loss: 1.2959 grad: 1.56e-01 flops: 2.37e+14 wps: 2.75e+04 iter: 0.6106 data: 0.0883 lr: 2.97e-05 mem: 54% pow: 645.989 W 0: INFO 26-04-29 21:33:10.118580 - 5:57:50 - step: 30020 acc: 0 loss: 1.2722 grad: 1.67e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5974 data: 0.0861 lr: 2.97e-05 mem: 47% pow: 664.652 W 0: INFO 26-04-29 21:33:23.551469 - 5:58:04 - step: 30030 acc: 0 loss: 1.5493 grad: 1.62e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5813 data: 0.1075 lr: 2.97e-05 mem: 47% pow: 657.246 W 0: INFO 26-04-29 21:33:37.121707 - 5:58:17 - step: 30040 acc: 0 loss: 1.4834 grad: 1.64e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6004 data: 0.0838 lr: 2.97e-05 mem: 47% pow: 671.37 W 0: INFO 26-04-29 21:33:50.853694 - 5:58:31 - step: 30050 acc: 0 loss: 1.2336 grad: 1.62e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6215 data: 0.0902 lr: 2.97e-05 mem: 47% pow: 648.492 W 0: INFO 26-04-29 21:34:04.523093 - 5:58:45 - step: 30060 acc: 0 loss: 1.5943 grad: 1.50e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6554 data: 0.0949 lr: 2.97e-05 mem: 47% pow: 628.576 W 0: INFO 26-04-29 21:34:18.084671 - 5:58:58 - step: 30070 acc: 0 loss: 1.2157 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5809 data: 0.1103 lr: 2.97e-05 mem: 47% pow: 662.683 W 0: INFO 26-04-29 21:34:31.949685 - 5:59:12 - step: 30080 acc: 0 loss: 1.2978 grad: 1.63e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.605 data: 0.086 lr: 2.96e-05 mem: 47% pow: 655.018 W 0: INFO 26-04-29 21:34:45.677222 - 5:59:26 - step: 30090 acc: 0 loss: 1.3138 grad: 1.60e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5933 data: 0.0896 lr: 2.96e-05 mem: 47% pow: 663.345 W 0: INFO 26-04-29 21:34:58.975814 - 5:59:39 - step: 30100 acc: 0 loss: 1.4285 grad: 1.64e-01 flops: 4.25e+14 wps: 4.93e+04 iter: 0.5904 data: 0.0904 lr: 2.96e-05 mem: 47% pow: 654.751 W 0: INFO 26-04-29 21:35:15.868290 - 5:59:56 - step: 30110 acc: 0 loss: 1.541 grad: 1.69e-01 flops: 3.35e+14 wps: 3.88e+04 iter: 0.6542 data: 0.0795 lr: 2.96e-05 mem: 54% pow: 629.899 W 0: INFO 26-04-29 21:35:29.517854 - 6:00:10 - step: 30120 acc: 0 loss: 1.2563 grad: 1.64e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6036 data: 0.094 lr: 2.96e-05 mem: 47% pow: 656.984 W 0: INFO 26-04-29 21:35:43.298106 - 6:00:24 - step: 30130 acc: 0 loss: 1.6728 grad: 1.60e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.711 data: 0.0908 lr: 2.96e-05 mem: 47% pow: 603.334 W 0: INFO 26-04-29 21:35:56.857044 - 6:00:37 - step: 30140 acc: 0 loss: 1.4275 grad: 1.55e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5984 data: 0.0841 lr: 2.96e-05 mem: 47% pow: 655.573 W 0: INFO 26-04-29 21:36:10.418076 - 6:00:51 - step: 30150 acc: 0 loss: 1.423 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6021 data: 0.0805 lr: 2.95e-05 mem: 47% pow: 666.568 W 0: INFO 26-04-29 21:36:24.304363 - 6:01:05 - step: 30160 acc: 0 loss: 1.3947 grad: 1.63e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6038 data: 0.0864 lr: 2.95e-05 mem: 47% pow: 658.006 W 0: INFO 26-04-29 21:36:37.831982 - 6:01:18 - step: 30170 acc: 0 loss: 1.4251 grad: 1.68e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5984 data: 0.0948 lr: 2.95e-05 mem: 47% pow: 652.226 W 0: INFO 26-04-29 21:36:51.315935 - 6:01:32 - step: 30180 acc: 0 loss: 1.177 grad: 1.55e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6078 data: 0.0825 lr: 2.95e-05 mem: 47% pow: 668.273 W 0: INFO 26-04-29 21:37:05.188843 - 6:01:45 - step: 30190 acc: 0 loss: 1.6184 grad: 1.62e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5921 data: 0.081 lr: 2.95e-05 mem: 47% pow: 665.046 W 0: INFO 26-04-29 21:37:18.684125 - 6:01:59 - step: 30200 acc: 0 loss: 1.1078 grad: 1.66e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.581 data: 0.1006 lr: 2.95e-05 mem: 47% pow: 661.123 W 0: INFO 26-04-29 21:37:35.462073 - 6:02:16 - step: 30210 acc: 0 loss: 1.1223 grad: 1.63e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.616 data: 0.0856 lr: 2.94e-05 mem: 54% pow: 652.038 W 0: INFO 26-04-29 21:37:49.131569 - 6:02:29 - step: 30220 acc: 0 loss: 1.4694 grad: 1.59e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.622 data: 0.0946 lr: 2.94e-05 mem: 47% pow: 639.997 W 0: INFO 26-04-29 21:38:02.813109 - 6:02:43 - step: 30230 acc: 0 loss: 1.0806 grad: 1.82e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.634 data: 0.1049 lr: 2.94e-05 mem: 47% pow: 625.816 W 0: INFO 26-04-29 21:38:16.471977 - 6:02:57 - step: 30240 acc: 0 loss: 1.3429 grad: 1.79e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5792 data: 0.0957 lr: 2.94e-05 mem: 47% pow: 666.104 W 0: INFO 26-04-29 21:38:29.999871 - 6:03:10 - step: 30250 acc: 0 loss: 1.5888 grad: 1.64e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6061 data: 0.0898 lr: 2.94e-05 mem: 47% pow: 653.715 W 0: INFO 26-04-29 21:38:43.482726 - 6:03:24 - step: 30260 acc: 0 loss: 1.3132 grad: 1.54e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5991 data: 0.0867 lr: 2.94e-05 mem: 47% pow: 657.682 W 0: INFO 26-04-29 21:38:57.004904 - 6:03:37 - step: 30270 acc: 0 loss: 1.2288 grad: 1.63e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5902 data: 0.0928 lr: 2.94e-05 mem: 47% pow: 660.191 W 0: INFO 26-04-29 21:39:10.609790 - 6:03:51 - step: 30280 acc: 0 loss: 1.3886 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6028 data: 0.0909 lr: 2.93e-05 mem: 47% pow: 655.532 W 0: INFO 26-04-29 21:39:24.047640 - 6:04:04 - step: 30290 acc: 0 loss: 1.4609 grad: 1.82e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5941 data: 0.0966 lr: 2.93e-05 mem: 47% pow: 661.341 W 0: INFO 26-04-29 21:39:37.608816 - 6:04:18 - step: 30300 acc: 0 loss: 1.3098 grad: 1.54e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6128 data: 0.0696 lr: 2.93e-05 mem: 47% pow: 666.088 W 0: INFO 26-04-29 21:39:54.181856 - 6:04:34 - step: 30310 acc: 0 loss: 1.0733 grad: 1.59e-01 flops: 3.41e+14 wps: 3.95e+04 iter: 0.6153 data: 0.093 lr: 2.93e-05 mem: 54% pow: 652.433 W 0: INFO 26-04-29 21:40:07.634917 - 6:04:48 - step: 30320 acc: 0 loss: 1.07 grad: 1.59e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.595 data: 0.1018 lr: 2.93e-05 mem: 47% pow: 659.501 W 0: INFO 26-04-29 21:40:21.146373 - 6:05:01 - step: 30330 acc: 0 loss: 1.3137 grad: 1.66e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.603 data: 0.0903 lr: 2.93e-05 mem: 47% pow: 657.344 W 0: INFO 26-04-29 21:40:35.075485 - 6:05:15 - step: 30340 acc: 0 loss: 1.2214 grad: 1.72e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5988 data: 0.0909 lr: 2.93e-05 mem: 47% pow: 650.37 W 0: INFO 26-04-29 21:40:48.671984 - 6:05:29 - step: 30350 acc: 0 loss: 1.2347 grad: 1.63e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6044 data: 0.0897 lr: 2.92e-05 mem: 47% pow: 659.752 W 0: INFO 26-04-29 21:41:02.179636 - 6:05:42 - step: 30360 acc: 0 loss: 1.29 grad: 1.63e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6039 data: 0.0813 lr: 2.92e-05 mem: 47% pow: 668.283 W 0: INFO 26-04-29 21:41:15.741908 - 6:05:56 - step: 30370 acc: 0 loss: 1.3805 grad: 1.62e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.592 data: 0.0892 lr: 2.92e-05 mem: 47% pow: 673.443 W 0: INFO 26-04-29 21:41:29.278056 - 6:06:10 - step: 30380 acc: 0 loss: 1.3404 grad: 1.65e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6004 data: 0.0987 lr: 2.92e-05 mem: 47% pow: 637.645 W 0: INFO 26-04-29 21:41:42.905935 - 6:06:23 - step: 30390 acc: 0 loss: 1.334 grad: 1.55e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6091 data: 0.0925 lr: 2.92e-05 mem: 47% pow: 654.952 W 0: INFO 26-04-29 21:41:56.653072 - 6:06:37 - step: 30400 acc: 0 loss: 1.3552 grad: 1.60e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5934 data: 0.0861 lr: 2.92e-05 mem: 47% pow: 663.925 W 0: INFO 26-04-29 21:42:13.085691 - 6:06:53 - step: 30410 acc: 0 loss: 1.2915 grad: 1.63e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.6049 data: 0.0826 lr: 2.92e-05 mem: 54% pow: 654.22 W 0: INFO 26-04-29 21:42:26.703058 - 6:07:07 - step: 30420 acc: 0 loss: 0.9332 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.61 data: 0.0924 lr: 2.91e-05 mem: 47% pow: 647.613 W 0: INFO 26-04-29 21:42:40.322448 - 6:07:21 - step: 30430 acc: 0 loss: 1.2866 grad: 1.68e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5977 data: 0.091 lr: 2.91e-05 mem: 47% pow: 661.612 W 0: INFO 26-04-29 21:42:53.775092 - 6:07:34 - step: 30440 acc: 0 loss: 1.5627 grad: 1.75e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5838 data: 0.0936 lr: 2.91e-05 mem: 47% pow: 651.569 W 0: INFO 26-04-29 21:43:07.625702 - 6:07:48 - step: 30450 acc: 0 loss: 1.4434 grad: 1.57e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6311 data: 0.1007 lr: 2.91e-05 mem: 47% pow: 632.103 W 0: INFO 26-04-29 21:43:21.366277 - 6:08:02 - step: 30460 acc: 0 loss: 1.1061 grad: 1.69e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6071 data: 0.0956 lr: 2.91e-05 mem: 47% pow: 654.409 W 0: INFO 26-04-29 21:43:34.955328 - 6:08:15 - step: 30470 acc: 0 loss: 1.134 grad: 1.76e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6016 data: 0.0942 lr: 2.91e-05 mem: 47% pow: 658.205 W 0: INFO 26-04-29 21:43:48.803987 - 6:08:29 - step: 30480 acc: 0 loss: 1.4921 grad: 1.61e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6048 data: 0.0947 lr: 2.90e-05 mem: 47% pow: 654.099 W 0: INFO 26-04-29 21:44:02.608275 - 6:08:43 - step: 30490 acc: 0 loss: 1.1706 grad: 1.62e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.63 data: 0.085 lr: 2.90e-05 mem: 47% pow: 635.697 W 0: INFO 26-04-29 21:44:16.416634 - 6:08:57 - step: 30500 acc: 0 loss: 1.4091 grad: 1.66e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5948 data: 0.0873 lr: 2.90e-05 mem: 47% pow: 671.988 W 0: INFO 26-04-29 21:44:33.332923 - 6:09:14 - step: 30510 acc: 0 loss: 1.1744 grad: 1.68e-01 flops: 3.34e+14 wps: 3.87e+04 iter: 0.5849 data: 0.0941 lr: 2.90e-05 mem: 54% pow: 657.632 W 0: INFO 26-04-29 21:44:46.718069 - 6:09:27 - step: 30520 acc: 0 loss: 1.4183 grad: 1.59e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.6118 data: 0.0911 lr: 2.90e-05 mem: 47% pow: 649.803 W 0: INFO 26-04-29 21:45:00.404378 - 6:09:41 - step: 30530 acc: 0 loss: 1.2432 grad: 1.58e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6988 data: 0.0828 lr: 2.90e-05 mem: 47% pow: 599.578 W 0: INFO 26-04-29 21:45:13.978756 - 6:09:54 - step: 30540 acc: 0 loss: 1.3011 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5804 data: 0.0856 lr: 2.90e-05 mem: 47% pow: 677.709 W 0: INFO 26-04-29 21:45:27.729923 - 6:10:08 - step: 30550 acc: 0 loss: 1.1287 grad: 1.72e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6065 data: 0.0844 lr: 2.89e-05 mem: 47% pow: 658.278 W 0: INFO 26-04-29 21:45:41.252485 - 6:10:22 - step: 30560 acc: 0 loss: 1.5254 grad: 1.55e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.634 data: 0.0423 lr: 2.89e-05 mem: 47% pow: 662.512 W 0: INFO 26-04-29 21:45:54.848564 - 6:10:35 - step: 30570 acc: 0 loss: 0.9853 grad: 1.60e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6227 data: 0.0842 lr: 2.89e-05 mem: 47% pow: 664.295 W 0: INFO 26-04-29 21:46:08.817628 - 6:10:49 - step: 30580 acc: 0 loss: 1.2843 grad: 1.60e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.8743 data: 0.0858 lr: 2.89e-05 mem: 47% pow: 503.631 W 0: INFO 26-04-29 21:46:22.987785 - 6:11:03 - step: 30590 acc: 0 loss: 1.1574 grad: 1.60e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.7369 data: 0.0549 lr: 2.89e-05 mem: 47% pow: 601.612 W 0: INFO 26-04-29 21:46:36.909302 - 6:11:17 - step: 30600 acc: 0 loss: 1.2973 grad: 1.54e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6355 data: 0.1075 lr: 2.89e-05 mem: 47% pow: 625.395 W 0: INFO 26-04-29 21:46:53.503796 - 6:11:34 - step: 30610 acc: 0 loss: 1.4553 grad: 1.64e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6038 data: 0.0866 lr: 2.89e-05 mem: 54% pow: 666.584 W 0: INFO 26-04-29 21:47:07.241320 - 6:11:48 - step: 30620 acc: 0 loss: 1.2136 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5914 data: 0.0859 lr: 2.88e-05 mem: 47% pow: 661.91 W 0: INFO 26-04-29 21:47:20.734800 - 6:12:01 - step: 30630 acc: 0 loss: 1.0234 grad: 1.70e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6047 data: 0.0753 lr: 2.88e-05 mem: 47% pow: 662.064 W 0: INFO 26-04-29 21:47:34.374741 - 6:12:15 - step: 30640 acc: 0 loss: 1.0603 grad: 1.61e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6526 data: 0.0261 lr: 2.88e-05 mem: 47% pow: 654.903 W 0: INFO 26-04-29 21:47:48.137091 - 6:12:28 - step: 30650 acc: 0 loss: 1.1348 grad: 1.54e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6424 data: 0.0772 lr: 2.88e-05 mem: 47% pow: 635.437 W 0: INFO 26-04-29 21:48:02.207306 - 6:12:43 - step: 30660 acc: 0 loss: 1.1681 grad: 1.55e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.5979 data: 0.0861 lr: 2.88e-05 mem: 47% pow: 666.044 W 0: INFO 26-04-29 21:48:16.204672 - 6:12:57 - step: 30670 acc: 0 loss: 1.2344 grad: 1.57e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6065 data: 0.0795 lr: 2.88e-05 mem: 47% pow: 666.083 W 0: INFO 26-04-29 21:48:30.014606 - 6:13:10 - step: 30680 acc: 0 loss: 1.6027 grad: 1.72e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5986 data: 0.0818 lr: 2.87e-05 mem: 47% pow: 665.09 W 0: INFO 26-04-29 21:48:43.971019 - 6:13:24 - step: 30690 acc: 0 loss: 1.2024 grad: 1.51e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6078 data: 0.0868 lr: 2.87e-05 mem: 47% pow: 659.465 W 0: INFO 26-04-29 21:48:57.845881 - 6:13:38 - step: 30700 acc: 0 loss: 1.1806 grad: 1.53e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.7776 data: 0.074 lr: 2.87e-05 mem: 47% pow: 580.954 W 0: INFO 26-04-29 21:49:14.594782 - 6:13:55 - step: 30710 acc: 0 loss: 1.0204 grad: 1.85e-01 flops: 3.37e+14 wps: 3.92e+04 iter: 0.6104 data: 0.0771 lr: 2.87e-05 mem: 54% pow: 656.877 W 0: INFO 26-04-29 21:49:29.076276 - 6:14:09 - step: 30720 acc: 0 loss: 1.4678 grad: 1.81e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.589 data: 0.0912 lr: 2.87e-05 mem: 47% pow: 658.619 W 0: INFO 26-04-29 21:49:43.340640 - 6:14:24 - step: 30730 acc: 0 loss: 1.3512 grad: 1.78e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.7023 data: 0.0804 lr: 2.87e-05 mem: 47% pow: 604.496 W 0: INFO 26-04-29 21:49:57.023165 - 6:14:37 - step: 30740 acc: 0 loss: 1.5008 grad: 1.65e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6015 data: 0.102 lr: 2.87e-05 mem: 47% pow: 655.047 W 0: INFO 26-04-29 21:50:10.662001 - 6:14:51 - step: 30750 acc: 0 loss: 1.2712 grad: 1.74e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6193 data: 0.0886 lr: 2.86e-05 mem: 47% pow: 665.478 W 0: INFO 26-04-29 21:50:24.761239 - 6:15:05 - step: 30760 acc: 0 loss: 1.3134 grad: 1.75e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5937 data: 0.0843 lr: 2.86e-05 mem: 47% pow: 656.278 W 0: INFO 26-04-29 21:50:38.304554 - 6:15:19 - step: 30770 acc: 0 loss: 1.5101 grad: 1.71e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6201 data: 0.0901 lr: 2.86e-05 mem: 47% pow: 659.451 W 0: INFO 26-04-29 21:50:52.058936 - 6:15:32 - step: 30780 acc: 0 loss: 1.1662 grad: 1.68e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6375 data: 0.0864 lr: 2.86e-05 mem: 47% pow: 639.364 W 0: INFO 26-04-29 21:51:06.201800 - 6:15:46 - step: 30790 acc: 0 loss: 1.4322 grad: 1.54e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6133 data: 0.0923 lr: 2.86e-05 mem: 47% pow: 652.422 W 0: INFO 26-04-29 21:51:20.028849 - 6:16:00 - step: 30800 acc: 0 loss: 1.3403 grad: 1.54e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.7278 data: 0.0038 lr: 2.86e-05 mem: 47% pow: 635.42 W 0: INFO 26-04-29 21:51:36.856592 - 6:16:17 - step: 30810 acc: 0 loss: 1.379 grad: 1.61e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.5853 data: 0.0893 lr: 2.86e-05 mem: 54% pow: 666.187 W 0: INFO 26-04-29 21:51:50.454436 - 6:16:31 - step: 30820 acc: 0 loss: 1.4733 grad: 1.53e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6 data: 0.0913 lr: 2.85e-05 mem: 47% pow: 665.778 W 0: INFO 26-04-29 21:52:04.115061 - 6:16:44 - step: 30830 acc: 0 loss: 1.4543 grad: 1.63e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5808 data: 0.0921 lr: 2.85e-05 mem: 47% pow: 669.072 W 0: INFO 26-04-29 21:52:17.753075 - 6:16:58 - step: 30840 acc: 0 loss: 1.3381 grad: 1.52e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5865 data: 0.1043 lr: 2.85e-05 mem: 47% pow: 655.353 W 0: INFO 26-04-29 21:52:31.569900 - 6:17:12 - step: 30850 acc: 0 loss: 1.3175 grad: 1.62e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5942 data: 0.0974 lr: 2.85e-05 mem: 47% pow: 659.05 W 0: INFO 26-04-29 21:52:45.314306 - 6:17:26 - step: 30860 acc: 0 loss: 1.2734 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6131 data: 0.0876 lr: 2.85e-05 mem: 47% pow: 651.435 W 0: INFO 26-04-29 21:52:59.030617 - 6:17:39 - step: 30870 acc: 0 loss: 1.635 grad: 1.56e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5908 data: 0.0946 lr: 2.85e-05 mem: 47% pow: 681.523 W 0: INFO 26-04-29 21:53:12.734315 - 6:17:53 - step: 30880 acc: 0 loss: 1.4107 grad: 1.56e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5952 data: 0.0834 lr: 2.85e-05 mem: 47% pow: 686.462 W 0: INFO 26-04-29 21:53:26.781269 - 6:18:07 - step: 30890 acc: 0 loss: 1.4993 grad: 1.63e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6455 data: 0.0688 lr: 2.84e-05 mem: 47% pow: 632.293 W 0: INFO 26-04-29 21:53:40.517267 - 6:18:21 - step: 30900 acc: 0 loss: 1.2301 grad: 1.65e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6178 data: 0.0833 lr: 2.84e-05 mem: 47% pow: 647.131 W 0: INFO 26-04-29 21:53:57.597799 - 6:18:38 - step: 30910 acc: 0 loss: 1.1366 grad: 1.65e-01 flops: 3.31e+14 wps: 3.84e+04 iter: 0.6462 data: 0.095 lr: 2.84e-05 mem: 54% pow: 624.182 W 0: INFO 26-04-29 21:54:11.462233 - 6:18:52 - step: 30920 acc: 0 loss: 1.4006 grad: 1.62e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6166 data: 0.0857 lr: 2.84e-05 mem: 47% pow: 649.184 W 0: INFO 26-04-29 21:54:25.296814 - 6:19:06 - step: 30930 acc: 0 loss: 1.3689 grad: 1.61e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6288 data: 0.0966 lr: 2.84e-05 mem: 47% pow: 654.074 W 0: INFO 26-04-29 21:54:39.133547 - 6:19:19 - step: 30940 acc: 0 loss: 1.4592 grad: 1.54e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7037 data: 0.0915 lr: 2.84e-05 mem: 47% pow: 595.281 W 0: INFO 26-04-29 21:54:52.841036 - 6:19:33 - step: 30950 acc: 0 loss: 1.5003 grad: 1.48e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5885 data: 0.0853 lr: 2.83e-05 mem: 47% pow: 664.516 W 0: INFO 26-04-29 21:55:06.570233 - 6:19:47 - step: 30960 acc: 0 loss: 1.6071 grad: 1.55e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6072 data: 0.0877 lr: 2.83e-05 mem: 47% pow: 680.376 W 0: INFO 26-04-29 21:55:20.423609 - 6:20:01 - step: 30970 acc: 0 loss: 1.3515 grad: 1.56e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6127 data: 0.0892 lr: 2.83e-05 mem: 47% pow: 650.133 W 0: INFO 26-04-29 21:55:34.469398 - 6:20:15 - step: 30980 acc: 0 loss: 1.502 grad: 1.63e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6205 data: 0.0911 lr: 2.83e-05 mem: 47% pow: 659.5 W 0: INFO 26-04-29 21:55:48.431511 - 6:20:29 - step: 30990 acc: 0 loss: 1.242 grad: 1.63e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5889 data: 0.0885 lr: 2.83e-05 mem: 47% pow: 659.571 W 0: INFO 26-04-29 21:56:02.250340 - 6:20:43 - step: 31000 acc: 0 loss: 1.2077 grad: 1.58e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6262 data: 0.0849 lr: 2.83e-05 mem: 47% pow: 642.799 W 0: INFO 26-04-29 21:56:05.977602 - 6:20:46 - garbage collection 0: INFO 26-04-29 21:56:20.356185 - 6:21:01 - step: 31010 acc: 0 loss: 1.1963 grad: 1.72e-01 flops: 3.12e+14 wps: 3.62e+04 iter: 0.6224 data: 0.0796 lr: 2.83e-05 mem: 54% pow: 648.929 W 0: INFO 26-04-29 21:56:34.157829 - 6:21:14 - step: 31020 acc: 0 loss: 1.5922 grad: 1.58e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6049 data: 0.0884 lr: 2.82e-05 mem: 47% pow: 659.12 W 0: INFO 26-04-29 21:56:48.031634 - 6:21:28 - step: 31030 acc: 0 loss: 1.3139 grad: 1.48e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.634 data: 0.0611 lr: 2.82e-05 mem: 47% pow: 649.38 W 0: INFO 26-04-29 21:57:01.672476 - 6:21:42 - step: 31040 acc: 0 loss: 1.6005 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5945 data: 0.1031 lr: 2.82e-05 mem: 47% pow: 643.559 W 0: INFO 26-04-29 21:57:15.699902 - 6:21:56 - step: 31050 acc: 0 loss: 1.1746 grad: 1.60e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.652 data: 0.0688 lr: 2.82e-05 mem: 47% pow: 634.957 W 0: INFO 26-04-29 21:57:29.514566 - 6:22:10 - step: 31060 acc: 0 loss: 1.4278 grad: 1.59e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6429 data: 0.0536 lr: 2.82e-05 mem: 47% pow: 646.814 W 0: INFO 26-04-29 21:57:43.592531 - 6:22:24 - step: 31070 acc: 0 loss: 1.232 grad: 1.64e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.5895 data: 0.0966 lr: 2.82e-05 mem: 47% pow: 660.694 W 0: INFO 26-04-29 21:57:57.791517 - 6:22:38 - step: 31080 acc: 0 loss: 1.1215 grad: 1.53e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.7438 data: 0.0917 lr: 2.82e-05 mem: 47% pow: 577.123 W 0: INFO 26-04-29 21:58:11.565035 - 6:22:52 - step: 31090 acc: 0 loss: 1.171 grad: 1.61e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.588 data: 0.0912 lr: 2.81e-05 mem: 47% pow: 661.107 W 0: INFO 26-04-29 21:58:25.210769 - 6:23:06 - step: 31100 acc: 0 loss: 1.5577 grad: 1.58e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6036 data: 0.0848 lr: 2.81e-05 mem: 47% pow: 667.194 W 0: INFO 26-04-29 21:58:42.144677 - 6:23:22 - step: 31110 acc: 0 loss: 1.2367 grad: 1.54e-01 flops: 3.34e+14 wps: 3.87e+04 iter: 0.6107 data: 0.088 lr: 2.81e-05 mem: 54% pow: 645.906 W 0: INFO 26-04-29 21:58:55.851234 - 6:23:36 - step: 31120 acc: 0 loss: 1.3334 grad: 1.57e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6126 data: 0.0826 lr: 2.81e-05 mem: 47% pow: 652.746 W 0: INFO 26-04-29 21:59:09.571831 - 6:23:50 - step: 31130 acc: 0 loss: 1.4504 grad: 1.56e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7671 data: 0.105 lr: 2.81e-05 mem: 47% pow: 557.203 W 0: INFO 26-04-29 21:59:23.396335 - 6:24:04 - step: 31140 acc: 0 loss: 1.3371 grad: 1.53e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6268 data: 0.061 lr: 2.81e-05 mem: 47% pow: 680.335 W 0: INFO 26-04-29 21:59:37.122368 - 6:24:17 - step: 31150 acc: 0 loss: 1.3691 grad: 1.59e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.5942 data: 0.0884 lr: 2.81e-05 mem: 47% pow: 669.434 W 0: INFO 26-04-29 21:59:51.182703 - 6:24:31 - step: 31160 acc: 0 loss: 0.9918 grad: 1.61e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6108 data: 0.0829 lr: 2.80e-05 mem: 47% pow: 660.376 W 0: INFO 26-04-29 22:00:04.961492 - 6:24:45 - step: 31170 acc: 0 loss: 1.5058 grad: 1.50e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6164 data: 0.0868 lr: 2.80e-05 mem: 47% pow: 653.834 W 0: INFO 26-04-29 22:00:18.721883 - 6:24:59 - step: 31180 acc: 0 loss: 1.4572 grad: 1.52e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.6341 data: 0.0474 lr: 2.80e-05 mem: 47% pow: 658.739 W 0: INFO 26-04-29 22:00:32.382608 - 6:25:13 - step: 31190 acc: 0 loss: 1.3602 grad: 1.62e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.624 data: 0.0783 lr: 2.80e-05 mem: 47% pow: 647.696 W 0: INFO 26-04-29 22:00:46.379422 - 6:25:27 - step: 31200 acc: 0 loss: 1.6331 grad: 1.52e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6227 data: 0.0884 lr: 2.80e-05 mem: 47% pow: 658.027 W 0: INFO 26-04-29 22:01:03.341226 - 6:25:44 - step: 31210 acc: 0 loss: 1.4184 grad: 1.55e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.5834 data: 0.0893 lr: 2.80e-05 mem: 54% pow: 668.995 W 0: INFO 26-04-29 22:01:17.194402 - 6:25:57 - step: 31220 acc: 0 loss: 1.3775 grad: 1.60e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5877 data: 0.0881 lr: 2.79e-05 mem: 47% pow: 662.828 W 0: INFO 26-04-29 22:01:31.740628 - 6:26:12 - step: 31230 acc: 0 loss: 1.4579 grad: 1.58e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 0.6999 data: 0.0898 lr: 2.79e-05 mem: 47% pow: 602.833 W 0: INFO 26-04-29 22:01:45.572886 - 6:26:26 - step: 31240 acc: 0 loss: 0.9084 grad: 1.65e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5985 data: 0.091 lr: 2.79e-05 mem: 47% pow: 666.422 W 0: INFO 26-04-29 22:01:59.527597 - 6:26:40 - step: 31250 acc: 0 loss: 1.9328 grad: 1.65e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.8287 data: 0.0866 lr: 2.79e-05 mem: 47% pow: 544.599 W 0: INFO 26-04-29 22:02:13.403604 - 6:26:54 - step: 31260 acc: 0 loss: 1.2186 grad: 1.53e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6078 data: 0.0735 lr: 2.79e-05 mem: 47% pow: 657.969 W 0: INFO 26-04-29 22:02:27.334522 - 6:27:08 - step: 31270 acc: 0 loss: 1.678 grad: 1.60e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.5821 data: 0.0928 lr: 2.79e-05 mem: 47% pow: 669.555 W 0: INFO 26-04-29 22:02:41.257903 - 6:27:22 - step: 31280 acc: 0 loss: 1.1956 grad: 1.62e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6045 data: 0.0845 lr: 2.79e-05 mem: 47% pow: 652.644 W 0: INFO 26-04-29 22:02:55.345078 - 6:27:36 - step: 31290 acc: 0 loss: 1.7102 grad: 1.91e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6318 data: 0.0829 lr: 2.78e-05 mem: 47% pow: 652.453 W 0: INFO 26-04-29 22:03:09.234380 - 6:27:50 - step: 31300 acc: 0 loss: 1.252 grad: 1.57e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6251 data: 0.0818 lr: 2.78e-05 mem: 47% pow: 655.072 W 0: INFO 26-04-29 22:03:26.177211 - 6:28:06 - step: 31310 acc: 0 loss: 1.1489 grad: 1.60e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.5804 data: 0.1952 lr: 2.78e-05 mem: 54% pow: 605.646 W 0: INFO 26-04-29 22:03:39.798748 - 6:28:20 - step: 31320 acc: 0 loss: 1.5356 grad: 1.72e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6166 data: 0.0944 lr: 2.78e-05 mem: 47% pow: 644.207 W 0: INFO 26-04-29 22:03:53.601008 - 6:28:34 - step: 31330 acc: 0 loss: 1.2536 grad: 1.54e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.597 data: 0.0808 lr: 2.78e-05 mem: 47% pow: 665.637 W 0: INFO 26-04-29 22:04:07.567376 - 6:28:48 - step: 31340 acc: 0 loss: 1.452 grad: 1.57e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5964 data: 0.0856 lr: 2.78e-05 mem: 47% pow: 657.736 W 0: INFO 26-04-29 22:04:21.101242 - 6:29:01 - step: 31350 acc: 0 loss: 1.2285 grad: 1.58e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6225 data: 0.073 lr: 2.78e-05 mem: 47% pow: 652.795 W 0: INFO 26-04-29 22:04:35.146862 - 6:29:15 - step: 31360 acc: 0 loss: 1.5489 grad: 1.80e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6244 data: 0.097 lr: 2.77e-05 mem: 47% pow: 635.251 W 0: INFO 26-04-29 22:04:49.029844 - 6:29:29 - step: 31370 acc: 0 loss: 1.1983 grad: 1.56e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5947 data: 0.0889 lr: 2.77e-05 mem: 47% pow: 659.105 W 0: INFO 26-04-29 22:05:02.611989 - 6:29:43 - step: 31380 acc: 0 loss: 1.5955 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5959 data: 0.0883 lr: 2.77e-05 mem: 47% pow: 661.941 W 0: INFO 26-04-29 22:05:16.486223 - 6:29:57 - step: 31390 acc: 0 loss: 1.315 grad: 1.57e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5913 data: 0.088 lr: 2.77e-05 mem: 47% pow: 665.34 W 0: INFO 26-04-29 22:05:30.169810 - 6:30:10 - step: 31400 acc: 0 loss: 1.3951 grad: 1.65e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6177 data: 0.0889 lr: 2.77e-05 mem: 47% pow: 648.673 W 0: INFO 26-04-29 22:05:46.845867 - 6:30:27 - step: 31410 acc: 0 loss: 1.89 grad: 1.54e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6591 data: 0.0794 lr: 2.77e-05 mem: 54% pow: 627.431 W 0: INFO 26-04-29 22:06:01.853955 - 6:30:42 - step: 31420 acc: 0 loss: 1.431 grad: 1.58e-01 flops: 3.76e+14 wps: 4.37e+04 iter: 0.606 data: 0.0859 lr: 2.76e-05 mem: 47% pow: 664.044 W 0: INFO 26-04-29 22:06:15.390455 - 6:30:56 - step: 31430 acc: 0 loss: 1.4999 grad: 1.60e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.6111 data: 0.088 lr: 2.76e-05 mem: 47% pow: 647.396 W 0: INFO 26-04-29 22:06:29.247740 - 6:31:10 - step: 31440 acc: 0 loss: 1.1446 grad: 1.59e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6283 data: 0.0761 lr: 2.76e-05 mem: 47% pow: 652.136 W 0: INFO 26-04-29 22:06:42.989963 - 6:31:23 - step: 31450 acc: 0 loss: 1.1732 grad: 1.58e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7329 data: 0.086 lr: 2.76e-05 mem: 47% pow: 585.162 W 0: INFO 26-04-29 22:06:56.854014 - 6:31:37 - step: 31460 acc: 0 loss: 1.3207 grad: 1.53e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5875 data: 0.0937 lr: 2.76e-05 mem: 47% pow: 659.419 W 0: INFO 26-04-29 22:07:10.878270 - 6:31:51 - step: 31470 acc: 0 loss: 1.2061 grad: 1.78e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5804 data: 0.1226 lr: 2.76e-05 mem: 47% pow: 650.836 W 0: INFO 26-04-29 22:07:25.118273 - 6:32:05 - step: 31480 acc: 0 loss: 1.5828 grad: 1.54e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.6305 data: 0.052 lr: 2.76e-05 mem: 47% pow: 682.941 W 0: INFO 26-04-29 22:07:38.966103 - 6:32:19 - step: 31490 acc: 0 loss: 0.8787 grad: 1.61e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.643 data: 0.0793 lr: 2.75e-05 mem: 47% pow: 633.53 W 0: INFO 26-04-29 22:07:52.954086 - 6:32:33 - step: 31500 acc: 0 loss: 1.1205 grad: 1.55e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5805 data: 0.0914 lr: 2.75e-05 mem: 47% pow: 695.536 W 0: INFO 26-04-29 22:08:09.592647 - 6:32:50 - step: 31510 acc: 0 loss: 1.4503 grad: 1.54e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6003 data: 0.0868 lr: 2.75e-05 mem: 54% pow: 682.308 W 0: INFO 26-04-29 22:08:23.411021 - 6:33:04 - step: 31520 acc: 0 loss: 1.1957 grad: 1.61e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5929 data: 0.0901 lr: 2.75e-05 mem: 47% pow: 664.637 W 0: INFO 26-04-29 22:08:36.970841 - 6:33:17 - step: 31530 acc: 0 loss: 1.2679 grad: 1.61e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6113 data: 0.0899 lr: 2.75e-05 mem: 47% pow: 648.871 W 0: INFO 26-04-29 22:08:50.824703 - 6:33:31 - step: 31540 acc: 0 loss: 1.6557 grad: 1.53e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6021 data: 0.088 lr: 2.75e-05 mem: 47% pow: 665.09 W 0: INFO 26-04-29 22:09:04.420385 - 6:33:45 - step: 31550 acc: 0 loss: 1.3532 grad: 1.61e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5985 data: 0.0831 lr: 2.75e-05 mem: 47% pow: 661.459 W 0: INFO 26-04-29 22:09:18.806498 - 6:33:59 - step: 31560 acc: 0 loss: 1.2252 grad: 1.70e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.5813 data: 0.2538 lr: 2.74e-05 mem: 47% pow: 575.148 W 0: INFO 26-04-29 22:09:32.918445 - 6:34:13 - step: 31570 acc: 0 loss: 1.4941 grad: 1.48e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.5979 data: 0.0854 lr: 2.74e-05 mem: 47% pow: 672.359 W 0: INFO 26-04-29 22:09:46.721791 - 6:34:27 - step: 31580 acc: 0 loss: 1.2029 grad: 1.61e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6069 data: 0.0881 lr: 2.74e-05 mem: 47% pow: 656.055 W 0: INFO 26-04-29 22:10:00.602449 - 6:34:41 - step: 31590 acc: 0 loss: 1.2751 grad: 1.56e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5918 data: 0.0795 lr: 2.74e-05 mem: 47% pow: 669.943 W 0: INFO 26-04-29 22:10:14.358288 - 6:34:55 - step: 31600 acc: 0 loss: 1.4221 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6163 data: 0.0884 lr: 2.74e-05 mem: 47% pow: 650.688 W 0: INFO 26-04-29 22:10:30.850209 - 6:35:11 - step: 31610 acc: 0 loss: 1.3146 grad: 1.50e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5787 data: 0.103 lr: 2.74e-05 mem: 54% pow: 662.621 W 0: INFO 26-04-29 22:10:44.502344 - 6:35:25 - step: 31620 acc: 0 loss: 1.3968 grad: 1.56e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6409 data: 0.0713 lr: 2.74e-05 mem: 47% pow: 648.091 W 0: INFO 26-04-29 22:10:58.689489 - 6:35:39 - step: 31630 acc: 0 loss: 1.4386 grad: 1.58e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.7196 data: 0.0802 lr: 2.73e-05 mem: 47% pow: 583.228 W 0: INFO 26-04-29 22:11:12.578541 - 6:35:53 - step: 31640 acc: 0 loss: 1.194 grad: 1.49e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6372 data: 0.0855 lr: 2.73e-05 mem: 47% pow: 642.482 W 0: INFO 26-04-29 22:11:26.310602 - 6:36:07 - step: 31650 acc: 0 loss: 1.7879 grad: 1.56e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5865 data: 0.0902 lr: 2.73e-05 mem: 47% pow: 661.818 W 0: INFO 26-04-29 22:11:40.089299 - 6:36:20 - step: 31660 acc: 0 loss: 1.3137 grad: 1.61e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6015 data: 0.0816 lr: 2.73e-05 mem: 47% pow: 661.905 W 0: INFO 26-04-29 22:11:53.755916 - 6:36:34 - step: 31670 acc: 0 loss: 1.445 grad: 1.64e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6008 data: 0.0875 lr: 2.73e-05 mem: 47% pow: 663.879 W 0: INFO 26-04-29 22:12:07.386722 - 6:36:48 - step: 31680 acc: 0 loss: 1.3273 grad: 1.54e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5953 data: 0.0834 lr: 2.73e-05 mem: 47% pow: 667.629 W 0: INFO 26-04-29 22:12:21.413224 - 6:37:02 - step: 31690 acc: 0 loss: 1.2554 grad: 1.50e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.7003 data: 0.0768 lr: 2.72e-05 mem: 47% pow: 599.137 W 0: INFO 26-04-29 22:12:34.932874 - 6:37:15 - step: 31700 acc: 0 loss: 1.2477 grad: 1.63e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5779 data: 0.0854 lr: 2.72e-05 mem: 47% pow: 677.496 W 0: INFO 26-04-29 22:12:51.530062 - 6:37:32 - step: 31710 acc: 0 loss: 1.02 grad: 1.55e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6123 data: 0.0804 lr: 2.72e-05 mem: 54% pow: 657.462 W 0: INFO 26-04-29 22:13:05.433506 - 6:37:46 - step: 31720 acc: 0 loss: 1.5431 grad: 1.59e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5787 data: 0.2274 lr: 2.72e-05 mem: 47% pow: 594.58 W 0: INFO 26-04-29 22:13:19.166179 - 6:37:59 - step: 31730 acc: 0 loss: 1.375 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6037 data: 0.0902 lr: 2.72e-05 mem: 47% pow: 649.95 W 0: INFO 26-04-29 22:13:32.917772 - 6:38:13 - step: 31740 acc: 0 loss: 1.5352 grad: 1.60e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6093 data: 0.0724 lr: 2.72e-05 mem: 47% pow: 664.092 W 0: INFO 26-04-29 22:13:46.980777 - 6:38:27 - step: 31750 acc: 0 loss: 1.1477 grad: 1.49e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6187 data: 0.0751 lr: 2.72e-05 mem: 47% pow: 658.151 W 0: INFO 26-04-29 22:14:00.754962 - 6:38:41 - step: 31760 acc: 0 loss: 1.2399 grad: 1.53e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6733 data: 0.0863 lr: 2.71e-05 mem: 47% pow: 609.05 W 0: INFO 26-04-29 22:14:14.550498 - 6:38:55 - step: 31770 acc: 0 loss: 1.5894 grad: 1.53e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6098 data: 0.0808 lr: 2.71e-05 mem: 47% pow: 678.299 W 0: INFO 26-04-29 22:14:28.308856 - 6:39:09 - step: 31780 acc: 0 loss: 1.7547 grad: 1.43e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6188 data: 0.066 lr: 2.71e-05 mem: 47% pow: 672.463 W 0: INFO 26-04-29 22:14:41.941009 - 6:39:22 - step: 31790 acc: 0 loss: 1.7178 grad: 1.49e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6141 data: 0.0918 lr: 2.71e-05 mem: 47% pow: 656.814 W 0: INFO 26-04-29 22:14:55.869677 - 6:39:36 - step: 31800 acc: 0 loss: 1.7137 grad: 1.47e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6077 data: 0.0832 lr: 2.71e-05 mem: 47% pow: 660.35 W 0: INFO 26-04-29 22:15:12.985433 - 6:39:53 - step: 31810 acc: 0 loss: 1.3702 grad: 1.46e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.6146 data: 0.0809 lr: 2.71e-05 mem: 54% pow: 655.485 W 0: INFO 26-04-29 22:15:26.811750 - 6:40:07 - step: 31820 acc: 0 loss: 1.4224 grad: 1.42e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5982 data: 0.0863 lr: 2.71e-05 mem: 47% pow: 664.166 W 0: INFO 26-04-29 22:15:40.597537 - 6:40:21 - step: 31830 acc: 0 loss: 1.4894 grad: 1.48e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6678 data: 0.0723 lr: 2.70e-05 mem: 47% pow: 627.453 W 0: INFO 26-04-29 22:15:54.552173 - 6:40:35 - step: 31840 acc: 0 loss: 1.4244 grad: 1.56e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5965 data: 0.0888 lr: 2.70e-05 mem: 47% pow: 671.348 W 0: INFO 26-04-29 22:16:08.565603 - 6:40:49 - step: 31850 acc: 0 loss: 1.581 grad: 1.50e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6022 data: 0.0823 lr: 2.70e-05 mem: 47% pow: 659.847 W 0: INFO 26-04-29 22:16:22.109394 - 6:41:02 - step: 31860 acc: 0 loss: 1.4721 grad: 1.52e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5926 data: 0.0803 lr: 2.70e-05 mem: 47% pow: 666.604 W 0: INFO 26-04-29 22:16:35.917219 - 6:41:16 - step: 31870 acc: 0 loss: 1.4504 grad: 1.44e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6154 data: 0.0939 lr: 2.70e-05 mem: 47% pow: 654.072 W 0: INFO 26-04-29 22:16:49.687078 - 6:41:30 - step: 31880 acc: 0 loss: 1.6496 grad: 1.57e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.621 data: 0.0877 lr: 2.70e-05 mem: 47% pow: 655.931 W 0: INFO 26-04-29 22:17:03.481662 - 6:41:44 - step: 31890 acc: 0 loss: 0.9743 grad: 1.48e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6015 data: 0.0731 lr: 2.69e-05 mem: 47% pow: 673.629 W 0: INFO 26-04-29 22:17:17.208604 - 6:41:58 - step: 31900 acc: 0 loss: 1.4183 grad: 1.51e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.5968 data: 0.0817 lr: 2.69e-05 mem: 47% pow: 670.368 W 0: INFO 26-04-29 22:17:33.992063 - 6:42:14 - step: 31910 acc: 0 loss: 1.2062 grad: 1.48e-01 flops: 3.36e+14 wps: 3.91e+04 iter: 0.6184 data: 0.0657 lr: 2.69e-05 mem: 54% pow: 664.508 W 0: INFO 26-04-29 22:17:47.831263 - 6:42:28 - step: 31920 acc: 0 loss: 1.7061 grad: 1.47e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6017 data: 0.0719 lr: 2.69e-05 mem: 47% pow: 665.179 W 0: INFO 26-04-29 22:18:01.691468 - 6:42:42 - step: 31930 acc: 0 loss: 1.5527 grad: 1.50e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5979 data: 0.1036 lr: 2.69e-05 mem: 47% pow: 656.649 W 0: INFO 26-04-29 22:18:15.537245 - 6:42:56 - step: 31940 acc: 0 loss: 1.4868 grad: 1.51e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5918 data: 0.0888 lr: 2.69e-05 mem: 47% pow: 665.943 W 0: INFO 26-04-29 22:18:29.293245 - 6:43:10 - step: 31950 acc: 0 loss: 1.2742 grad: 1.64e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5881 data: 0.086 lr: 2.69e-05 mem: 47% pow: 659.974 W 0: INFO 26-04-29 22:18:43.074708 - 6:43:23 - step: 31960 acc: 0 loss: 1.3055 grad: 1.48e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5989 data: 0.0872 lr: 2.68e-05 mem: 47% pow: 664.077 W 0: INFO 26-04-29 22:18:56.857890 - 6:43:37 - step: 31970 acc: 0 loss: 1.4309 grad: 1.48e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6122 data: 0.0897 lr: 2.68e-05 mem: 47% pow: 646.0 W 0: INFO 26-04-29 22:19:10.723031 - 6:43:51 - step: 31980 acc: 0 loss: 1.4839 grad: 1.50e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6063 data: 0.091 lr: 2.68e-05 mem: 47% pow: 662.831 W 0: INFO 26-04-29 22:19:24.877598 - 6:44:05 - step: 31990 acc: 0 loss: 1.5277 grad: 1.49e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5932 data: 0.0864 lr: 2.68e-05 mem: 47% pow: 659.561 W 0: INFO 26-04-29 22:19:38.844788 - 6:44:19 - step: 32000 acc: 0 loss: 1.6667 grad: 1.48e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6068 data: 0.0875 lr: 2.68e-05 mem: 47% pow: 655.076 W 0: INFO 26-04-29 22:19:42.593546 - 6:44:23 - garbage collection 0: INFO 26-04-29 22:19:57.347464 - 6:44:38 - step: 32010 acc: 0 loss: 1.1479 grad: 1.52e-01 flops: 3.05e+14 wps: 3.54e+04 iter: 0.6531 data: 0.078 lr: 2.68e-05 mem: 54% pow: 643.064 W 0: INFO 26-04-29 22:20:11.150635 - 6:44:51 - step: 32020 acc: 0 loss: 1.3859 grad: 1.55e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5903 data: 0.0907 lr: 2.68e-05 mem: 47% pow: 657.143 W 0: INFO 26-04-29 22:20:24.885832 - 6:45:05 - step: 32030 acc: 0 loss: 1.2327 grad: 1.42e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5806 data: 0.0909 lr: 2.67e-05 mem: 47% pow: 663.885 W 0: INFO 26-04-29 22:20:38.935699 - 6:45:19 - step: 32040 acc: 0 loss: 1.4795 grad: 1.55e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6293 data: 0.0893 lr: 2.67e-05 mem: 47% pow: 641.547 W 0: INFO 26-04-29 22:20:52.877887 - 6:45:33 - step: 32050 acc: 0 loss: 1.1416 grad: 1.53e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5927 data: 0.0864 lr: 2.67e-05 mem: 47% pow: 660.086 W 0: INFO 26-04-29 22:21:06.865870 - 6:45:47 - step: 32060 acc: 0 loss: 1.2417 grad: 1.51e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6975 data: 0.0901 lr: 2.67e-05 mem: 47% pow: 596.702 W 0: INFO 26-04-29 22:21:20.466397 - 6:46:01 - step: 32070 acc: 0 loss: 1.4866 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5795 data: 0.0974 lr: 2.67e-05 mem: 47% pow: 666.351 W 0: INFO 26-04-29 22:21:34.086024 - 6:46:14 - step: 32080 acc: 0 loss: 1.2415 grad: 1.53e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5801 data: 0.1035 lr: 2.67e-05 mem: 47% pow: 662.951 W 0: INFO 26-04-29 22:21:47.734023 - 6:46:28 - step: 32090 acc: 0 loss: 1.268 grad: 1.57e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6192 data: 0.0889 lr: 2.67e-05 mem: 47% pow: 660.497 W 0: INFO 26-04-29 22:22:01.858936 - 6:46:42 - step: 32100 acc: 0 loss: 1.4757 grad: 1.55e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6043 data: 0.0769 lr: 2.66e-05 mem: 47% pow: 669.377 W 0: INFO 26-04-29 22:22:18.299087 - 6:46:59 - step: 32110 acc: 0 loss: 1.7532 grad: 1.45e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.5833 data: 0.0859 lr: 2.66e-05 mem: 54% pow: 669.874 W 0: INFO 26-04-29 22:22:31.781337 - 6:47:12 - step: 32120 acc: 0 loss: 1.4147 grad: 1.49e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5949 data: 0.0899 lr: 2.66e-05 mem: 47% pow: 665.579 W 0: INFO 26-04-29 22:22:45.262124 - 6:47:26 - step: 32130 acc: 0 loss: 1.6839 grad: 1.47e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5941 data: 0.0869 lr: 2.66e-05 mem: 47% pow: 665.874 W 0: INFO 26-04-29 22:22:58.769310 - 6:47:39 - step: 32140 acc: 0 loss: 1.5141 grad: 1.47e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6045 data: 0.0899 lr: 2.66e-05 mem: 47% pow: 652.37 W 0: INFO 26-04-29 22:23:12.409545 - 6:47:53 - step: 32150 acc: 0 loss: 1.2769 grad: 1.46e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6098 data: 0.0839 lr: 2.66e-05 mem: 47% pow: 660.008 W 0: INFO 26-04-29 22:23:26.179687 - 6:48:06 - step: 32160 acc: 0 loss: 1.4837 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6292 data: 0.0591 lr: 2.65e-05 mem: 47% pow: 663.679 W 0: INFO 26-04-29 22:23:40.010293 - 6:48:20 - step: 32170 acc: 0 loss: 1.6952 grad: 1.51e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6059 data: 0.0857 lr: 2.65e-05 mem: 47% pow: 661.522 W 0: INFO 26-04-29 22:23:53.483948 - 6:48:34 - step: 32180 acc: 0 loss: 1.2961 grad: 1.43e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5832 data: 0.099 lr: 2.65e-05 mem: 47% pow: 661.794 W 0: INFO 26-04-29 22:24:07.584852 - 6:48:48 - step: 32190 acc: 0 loss: 1.3805 grad: 1.58e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6184 data: 0.0931 lr: 2.65e-05 mem: 47% pow: 638.852 W 0: INFO 26-04-29 22:24:21.421225 - 6:49:02 - step: 32200 acc: 0 loss: 2.1621 grad: 1.56e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6198 data: 0.0906 lr: 2.65e-05 mem: 47% pow: 648.845 W 0: INFO 26-04-29 22:24:37.907122 - 6:49:18 - step: 32210 acc: 0 loss: 1.1787 grad: 1.45e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.6473 data: 0.0838 lr: 2.65e-05 mem: 54% pow: 636.362 W 0: INFO 26-04-29 22:24:51.403900 - 6:49:32 - step: 32220 acc: 0 loss: 1.1499 grad: 1.49e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.62 data: 0.0891 lr: 2.65e-05 mem: 47% pow: 646.855 W 0: INFO 26-04-29 22:25:05.008546 - 6:49:45 - step: 32230 acc: 0 loss: 1.6195 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5897 data: 0.0777 lr: 2.64e-05 mem: 47% pow: 675.745 W 0: INFO 26-04-29 22:25:18.673477 - 6:49:59 - step: 32240 acc: 0 loss: 1.7448 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5877 data: 0.0934 lr: 2.64e-05 mem: 47% pow: 661.403 W 0: INFO 26-04-29 22:25:32.502821 - 6:50:13 - step: 32250 acc: 0 loss: 1.2112 grad: 1.51e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6331 data: 0.0864 lr: 2.64e-05 mem: 47% pow: 636.656 W 0: INFO 26-04-29 22:25:46.953970 - 6:50:27 - step: 32260 acc: 0 loss: 1.7538 grad: 1.49e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6255 data: 0.0882 lr: 2.64e-05 mem: 47% pow: 642.769 W 0: INFO 26-04-29 22:26:01.173815 - 6:50:41 - step: 32270 acc: 0 loss: 1.4923 grad: 1.53e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.5913 data: 0.0894 lr: 2.64e-05 mem: 47% pow: 668.874 W 0: INFO 26-04-29 22:26:14.723011 - 6:50:55 - step: 32280 acc: 0 loss: 1.3899 grad: 1.47e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6553 data: 0.0649 lr: 2.64e-05 mem: 47% pow: 635.846 W 0: INFO 26-04-29 22:26:28.350447 - 6:51:09 - step: 32290 acc: 0 loss: 1.4778 grad: 1.48e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6124 data: 0.117 lr: 2.64e-05 mem: 47% pow: 640.953 W 0: INFO 26-04-29 22:26:42.233438 - 6:51:23 - step: 32300 acc: 0 loss: 1.5499 grad: 1.47e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6612 data: 0.0179 lr: 2.63e-05 mem: 47% pow: 666.99 W 0: INFO 26-04-29 22:26:58.847585 - 6:51:39 - step: 32310 acc: 0 loss: 1.3448 grad: 1.60e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.5957 data: 0.0925 lr: 2.63e-05 mem: 54% pow: 668.738 W 0: INFO 26-04-29 22:27:12.573982 - 6:51:53 - step: 32320 acc: 0 loss: 1.4738 grad: 1.56e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6061 data: 0.0848 lr: 2.63e-05 mem: 47% pow: 655.29 W 0: INFO 26-04-29 22:27:26.193020 - 6:52:06 - step: 32330 acc: 0 loss: 1.1731 grad: 1.42e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6079 data: 0.0898 lr: 2.63e-05 mem: 47% pow: 649.126 W 0: INFO 26-04-29 22:27:39.895485 - 6:52:20 - step: 32340 acc: 0 loss: 1.1075 grad: 1.44e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5927 data: 0.0892 lr: 2.63e-05 mem: 47% pow: 660.405 W 0: INFO 26-04-29 22:27:53.737828 - 6:52:34 - step: 32350 acc: 0 loss: 1.2192 grad: 1.46e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5956 data: 0.0827 lr: 2.63e-05 mem: 47% pow: 656.566 W 0: INFO 26-04-29 22:28:07.391860 - 6:52:48 - step: 32360 acc: 0 loss: 1.2771 grad: 1.66e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.595 data: 0.0839 lr: 2.62e-05 mem: 47% pow: 659.634 W 0: INFO 26-04-29 22:28:20.886953 - 6:53:01 - step: 32370 acc: 0 loss: 1.1276 grad: 1.61e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5929 data: 0.0934 lr: 2.62e-05 mem: 47% pow: 681.308 W 0: INFO 26-04-29 22:28:34.568223 - 6:53:15 - step: 32380 acc: 0 loss: 1.4575 grad: 1.47e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.7321 data: 0.0832 lr: 2.62e-05 mem: 47% pow: 588.112 W 0: INFO 26-04-29 22:28:48.052483 - 6:53:28 - step: 32390 acc: 0 loss: 1.3054 grad: 1.44e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6253 data: 0.0885 lr: 2.62e-05 mem: 47% pow: 649.232 W 0: INFO 26-04-29 22:29:01.774913 - 6:53:42 - step: 32400 acc: 0 loss: 1.5424 grad: 1.51e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6785 data: 0.0941 lr: 2.62e-05 mem: 47% pow: 612.764 W 0: INFO 26-04-29 22:29:18.299976 - 6:53:59 - step: 32410 acc: 0 loss: 1.8387 grad: 1.48e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.588 data: 0.088 lr: 2.62e-05 mem: 54% pow: 665.775 W 0: INFO 26-04-29 22:29:31.984246 - 6:54:12 - step: 32420 acc: 0 loss: 1.513 grad: 1.63e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6357 data: 0.0767 lr: 2.62e-05 mem: 47% pow: 651.105 W 0: INFO 26-04-29 22:29:45.674530 - 6:54:26 - step: 32430 acc: 0 loss: 1.4821 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6111 data: 0.0882 lr: 2.61e-05 mem: 47% pow: 644.757 W 0: INFO 26-04-29 22:29:59.227420 - 6:54:40 - step: 32440 acc: 0 loss: 1.2891 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6085 data: 0.0832 lr: 2.61e-05 mem: 47% pow: 663.472 W 0: INFO 26-04-29 22:30:12.689442 - 6:54:53 - step: 32450 acc: 0 loss: 1.3266 grad: 1.49e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5782 data: 0.1171 lr: 2.61e-05 mem: 47% pow: 655.005 W 0: INFO 26-04-29 22:30:26.295796 - 6:55:07 - step: 32460 acc: 0 loss: 1.8865 grad: 1.47e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.607 data: 0.0795 lr: 2.61e-05 mem: 47% pow: 660.821 W 0: INFO 26-04-29 22:30:39.797600 - 6:55:20 - step: 32470 acc: 0 loss: 1.2936 grad: 1.50e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6225 data: 0.091 lr: 2.61e-05 mem: 47% pow: 646.98 W 0: INFO 26-04-29 22:30:53.598064 - 6:55:34 - step: 32480 acc: 0 loss: 1.3945 grad: 1.51e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5838 data: 0.094 lr: 2.61e-05 mem: 47% pow: 667.8 W 0: INFO 26-04-29 22:31:07.401024 - 6:55:48 - step: 32490 acc: 0 loss: 1.0748 grad: 1.48e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5943 data: 0.0866 lr: 2.61e-05 mem: 47% pow: 659.826 W 0: INFO 26-04-29 22:31:21.081093 - 6:56:01 - step: 32500 acc: 0 loss: 1.4945 grad: 1.45e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6198 data: 0.0787 lr: 2.60e-05 mem: 47% pow: 649.498 W 0: INFO 26-04-29 22:31:37.920429 - 6:56:18 - step: 32510 acc: 0 loss: 1.3432 grad: 1.50e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.6002 data: 0.0849 lr: 2.60e-05 mem: 54% pow: 665.714 W 0: INFO 26-04-29 22:31:51.361620 - 6:56:32 - step: 32520 acc: 0 loss: 1.8317 grad: 1.48e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6033 data: 0.0849 lr: 2.60e-05 mem: 47% pow: 660.123 W 0: INFO 26-04-29 22:32:04.905519 - 6:56:45 - step: 32530 acc: 0 loss: 1.2502 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6108 data: 0.0891 lr: 2.60e-05 mem: 47% pow: 653.035 W 0: INFO 26-04-29 22:32:18.461942 - 6:56:59 - step: 32540 acc: 0 loss: 1.3626 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5946 data: 0.0848 lr: 2.60e-05 mem: 47% pow: 660.495 W 0: INFO 26-04-29 22:32:32.091210 - 6:57:12 - step: 32550 acc: 0 loss: 1.7195 grad: 1.48e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5869 data: 0.0835 lr: 2.60e-05 mem: 47% pow: 673.011 W 0: INFO 26-04-29 22:32:45.810746 - 6:57:26 - step: 32560 acc: 0 loss: 1.2886 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6473 data: 0.0893 lr: 2.60e-05 mem: 47% pow: 626.007 W 0: INFO 26-04-29 22:32:59.421746 - 6:57:40 - step: 32570 acc: 0 loss: 1.017 grad: 1.46e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5975 data: 0.0852 lr: 2.59e-05 mem: 47% pow: 668.377 W 0: INFO 26-04-29 22:33:13.001437 - 6:57:53 - step: 32580 acc: 0 loss: 1.2485 grad: 1.47e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5897 data: 0.0857 lr: 2.59e-05 mem: 47% pow: 665.003 W 0: INFO 26-04-29 22:33:26.815191 - 6:58:07 - step: 32590 acc: 0 loss: 1.638 grad: 1.50e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6055 data: 0.0843 lr: 2.59e-05 mem: 47% pow: 656.274 W 0: INFO 26-04-29 22:33:40.368950 - 6:58:21 - step: 32600 acc: 0 loss: 1.4458 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6528 data: 0.0517 lr: 2.59e-05 mem: 47% pow: 660.317 W 0: INFO 26-04-29 22:33:56.765326 - 6:58:37 - step: 32610 acc: 0 loss: 1.3464 grad: 1.49e-01 flops: 3.45e+14 wps: 4.00e+04 iter: 0.5931 data: 0.0878 lr: 2.59e-05 mem: 54% pow: 661.715 W 0: INFO 26-04-29 22:34:10.355589 - 6:58:51 - step: 32620 acc: 0 loss: 1.3309 grad: 1.60e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5814 data: 0.1533 lr: 2.59e-05 mem: 47% pow: 628.877 W 0: INFO 26-04-29 22:34:23.973788 - 6:59:04 - step: 32630 acc: 0 loss: 1.473 grad: 1.45e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6486 data: 0.0456 lr: 2.58e-05 mem: 47% pow: 662.583 W 0: INFO 26-04-29 22:34:37.856782 - 6:59:18 - step: 32640 acc: 0 loss: 1.4158 grad: 1.49e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6336 data: 0.0799 lr: 2.58e-05 mem: 47% pow: 642.843 W 0: INFO 26-04-29 22:34:51.703153 - 6:59:32 - step: 32650 acc: 0 loss: 1.8868 grad: 1.47e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6094 data: 0.0777 lr: 2.58e-05 mem: 47% pow: 671.733 W 0: INFO 26-04-29 22:35:05.725415 - 6:59:46 - step: 32660 acc: 0 loss: 1.3005 grad: 1.52e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.606 data: 0.0846 lr: 2.58e-05 mem: 47% pow: 661.777 W 0: INFO 26-04-29 22:35:19.296093 - 7:00:00 - step: 32670 acc: 0 loss: 1.7714 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6004 data: 0.0896 lr: 2.58e-05 mem: 47% pow: 657.21 W 0: INFO 26-04-29 22:35:32.837393 - 7:00:13 - step: 32680 acc: 0 loss: 1.2249 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5957 data: 0.0839 lr: 2.58e-05 mem: 47% pow: 657.673 W 0: INFO 26-04-29 22:35:46.448302 - 7:00:27 - step: 32690 acc: 0 loss: 1.3228 grad: 1.54e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5911 data: 0.0826 lr: 2.58e-05 mem: 47% pow: 674.232 W 0: INFO 26-04-29 22:36:00.354453 - 7:00:41 - step: 32700 acc: 0 loss: 1.6054 grad: 1.49e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6089 data: 0.085 lr: 2.57e-05 mem: 47% pow: 665.978 W 0: INFO 26-04-29 22:36:16.805841 - 7:00:57 - step: 32710 acc: 0 loss: 1.4436 grad: 1.76e-01 flops: 3.43e+14 wps: 3.99e+04 iter: 0.5925 data: 0.1103 lr: 2.57e-05 mem: 54% pow: 648.831 W 0: INFO 26-04-29 22:36:30.408700 - 7:01:11 - step: 32720 acc: 0 loss: 1.4848 grad: 1.58e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6033 data: 0.0898 lr: 2.57e-05 mem: 47% pow: 653.876 W 0: INFO 26-04-29 22:36:43.921603 - 7:01:24 - step: 32730 acc: 0 loss: 1.2912 grad: 1.54e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6068 data: 0.0752 lr: 2.57e-05 mem: 47% pow: 663.57 W 0: INFO 26-04-29 22:36:57.509788 - 7:01:38 - step: 32740 acc: 0 loss: 1.3271 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6053 data: 0.0871 lr: 2.57e-05 mem: 47% pow: 665.149 W 0: INFO 26-04-29 22:37:11.161078 - 7:01:51 - step: 32750 acc: 0 loss: 1.2064 grad: 1.48e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5875 data: 0.0986 lr: 2.57e-05 mem: 47% pow: 670.896 W 0: INFO 26-04-29 22:37:24.698125 - 7:02:05 - step: 32760 acc: 0 loss: 1.8235 grad: 1.61e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5937 data: 0.1023 lr: 2.57e-05 mem: 47% pow: 646.523 W 0: INFO 26-04-29 22:37:38.510519 - 7:02:19 - step: 32770 acc: 0 loss: 1.6884 grad: 1.52e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6417 data: 0.0907 lr: 2.56e-05 mem: 47% pow: 624.617 W 0: INFO 26-04-29 22:37:52.156443 - 7:02:32 - step: 32780 acc: 0 loss: 1.2308 grad: 1.56e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5924 data: 0.0882 lr: 2.56e-05 mem: 47% pow: 657.683 W 0: INFO 26-04-29 22:38:06.381821 - 7:02:47 - step: 32790 acc: 0 loss: 1.37 grad: 1.45e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.5932 data: 0.0838 lr: 2.56e-05 mem: 47% pow: 661.552 W 0: INFO 26-04-29 22:38:20.209414 - 7:03:01 - step: 32800 acc: 0 loss: 1.3041 grad: 1.54e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6071 data: 0.0819 lr: 2.56e-05 mem: 47% pow: 657.698 W 0: INFO 26-04-29 22:38:36.747173 - 7:03:17 - step: 32810 acc: 0 loss: 1.6209 grad: 1.80e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6295 data: 0.0829 lr: 2.56e-05 mem: 54% pow: 641.145 W 0: INFO 26-04-29 22:38:50.206516 - 7:03:31 - step: 32820 acc: 0 loss: 1.5676 grad: 1.53e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5925 data: 0.0889 lr: 2.56e-05 mem: 47% pow: 660.037 W 0: INFO 26-04-29 22:39:03.845304 - 7:03:44 - step: 32830 acc: 0 loss: 1.5132 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6592 data: 0.0843 lr: 2.56e-05 mem: 47% pow: 627.062 W 0: INFO 26-04-29 22:39:17.484256 - 7:03:58 - step: 32840 acc: 0 loss: 1.2679 grad: 1.47e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5948 data: 0.0842 lr: 2.55e-05 mem: 47% pow: 665.884 W 0: INFO 26-04-29 22:39:31.070531 - 7:04:11 - step: 32850 acc: 0 loss: 1.5534 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6011 data: 0.0888 lr: 2.55e-05 mem: 47% pow: 652.359 W 0: INFO 26-04-29 22:39:44.612476 - 7:04:25 - step: 32860 acc: 0 loss: 1.0659 grad: 1.62e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5865 data: 0.0857 lr: 2.55e-05 mem: 47% pow: 671.209 W 0: INFO 26-04-29 22:39:58.334961 - 7:04:39 - step: 32870 acc: 0 loss: 1.1296 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6108 data: 0.0873 lr: 2.55e-05 mem: 47% pow: 643.219 W 0: INFO 26-04-29 22:40:11.932862 - 7:04:52 - step: 32880 acc: 0 loss: 1.276 grad: 1.51e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6857 data: 0.0873 lr: 2.55e-05 mem: 47% pow: 621.88 W 0: INFO 26-04-29 22:40:25.544974 - 7:05:06 - step: 32890 acc: 0 loss: 1.1901 grad: 1.50e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5825 data: 0.094 lr: 2.55e-05 mem: 47% pow: 659.379 W 0: INFO 26-04-29 22:40:39.104796 - 7:05:19 - step: 32900 acc: 0 loss: 1.2115 grad: 1.44e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5907 data: 0.0894 lr: 2.54e-05 mem: 47% pow: 663.134 W 0: INFO 26-04-29 22:40:55.677442 - 7:05:36 - step: 32910 acc: 0 loss: 0.8963 grad: 1.50e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6289 data: 0.0869 lr: 2.54e-05 mem: 54% pow: 636.076 W 0: INFO 26-04-29 22:41:09.213210 - 7:05:50 - step: 32920 acc: 0 loss: 1.4323 grad: 1.45e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.585 data: 0.085 lr: 2.54e-05 mem: 47% pow: 665.045 W 0: INFO 26-04-29 22:41:22.934040 - 7:06:03 - step: 32930 acc: 0 loss: 1.3988 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6034 data: 0.0861 lr: 2.54e-05 mem: 47% pow: 661.512 W 0: INFO 26-04-29 22:41:36.397031 - 7:06:17 - step: 32940 acc: 0 loss: 1.2849 grad: 1.48e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.629 data: 0.0832 lr: 2.54e-05 mem: 47% pow: 646.867 W 0: INFO 26-04-29 22:41:50.145072 - 7:06:30 - step: 32950 acc: 0 loss: 1.6132 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.617 data: 0.1051 lr: 2.54e-05 mem: 47% pow: 631.563 W 0: INFO 26-04-29 22:42:03.664765 - 7:06:44 - step: 32960 acc: 0 loss: 1.4738 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5911 data: 0.0782 lr: 2.54e-05 mem: 47% pow: 670.746 W 0: INFO 26-04-29 22:42:17.351322 - 7:06:58 - step: 32970 acc: 0 loss: 1.2295 grad: 1.47e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6206 data: 0.0933 lr: 2.53e-05 mem: 47% pow: 649.359 W 0: INFO 26-04-29 22:42:31.013502 - 7:07:11 - step: 32980 acc: 0 loss: 1.615 grad: 1.44e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6179 data: 0.0909 lr: 2.53e-05 mem: 47% pow: 645.383 W 0: INFO 26-04-29 22:42:44.660368 - 7:07:25 - step: 32990 acc: 0 loss: 1.2781 grad: 1.44e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6027 data: 0.0902 lr: 2.53e-05 mem: 47% pow: 651.977 W 0: INFO 26-04-29 22:42:58.137112 - 7:07:38 - step: 33000 acc: 0 loss: 1.2602 grad: 1.45e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5867 data: 0.0878 lr: 2.53e-05 mem: 47% pow: 665.287 W 0: INFO 26-04-29 22:43:01.849945 - 7:07:42 - garbage collection 0: INFO 26-04-29 22:43:16.607392 - 7:07:57 - step: 33010 acc: 0 loss: 1.5967 grad: 1.51e-01 flops: 3.06e+14 wps: 3.55e+04 iter: 0.6583 data: 0.0855 lr: 2.53e-05 mem: 54% pow: 631.915 W 0: INFO 26-04-29 22:43:30.430253 - 7:08:11 - step: 33020 acc: 0 loss: 1.389 grad: 1.47e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.598 data: 0.0862 lr: 2.53e-05 mem: 47% pow: 667.103 W 0: INFO 26-04-29 22:43:44.028497 - 7:08:24 - step: 33030 acc: 0 loss: 1.0384 grad: 1.43e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6167 data: 0.0709 lr: 2.53e-05 mem: 47% pow: 663.346 W 0: INFO 26-04-29 22:43:57.859463 - 7:08:38 - step: 33040 acc: 0 loss: 1.7092 grad: 1.53e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6143 data: 0.0786 lr: 2.52e-05 mem: 47% pow: 658.406 W 0: INFO 26-04-29 22:44:11.737935 - 7:08:52 - step: 33050 acc: 0 loss: 1.3238 grad: 1.48e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6257 data: 0.075 lr: 2.52e-05 mem: 47% pow: 645.283 W 0: INFO 26-04-29 22:44:25.424797 - 7:09:06 - step: 33060 acc: 0 loss: 1.4086 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5954 data: 0.096 lr: 2.52e-05 mem: 47% pow: 673.694 W 0: INFO 26-04-29 22:44:38.957536 - 7:09:19 - step: 33070 acc: 0 loss: 1.548 grad: 1.53e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.6083 data: 0.0851 lr: 2.52e-05 mem: 47% pow: 653.317 W 0: INFO 26-04-29 22:44:52.587579 - 7:09:33 - step: 33080 acc: 0 loss: 1.4969 grad: 1.54e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6217 data: 0.0755 lr: 2.52e-05 mem: 47% pow: 662.782 W 0: INFO 26-04-29 22:45:06.428240 - 7:09:47 - step: 33090 acc: 0 loss: 1.313 grad: 1.50e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6175 data: 0.0642 lr: 2.52e-05 mem: 47% pow: 659.935 W 0: INFO 26-04-29 22:45:20.089535 - 7:10:00 - step: 33100 acc: 0 loss: 1.9465 grad: 1.46e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5994 data: 0.0901 lr: 2.51e-05 mem: 47% pow: 671.203 W 0: INFO 26-04-29 22:45:36.805929 - 7:10:17 - step: 33110 acc: 0 loss: 1.2442 grad: 1.47e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.6794 data: 0.0839 lr: 2.51e-05 mem: 54% pow: 608.478 W 0: INFO 26-04-29 22:45:50.556563 - 7:10:31 - step: 33120 acc: 0 loss: 1.2236 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6055 data: 0.0843 lr: 2.51e-05 mem: 47% pow: 666.052 W 0: INFO 26-04-29 22:46:04.484630 - 7:10:45 - step: 33130 acc: 0 loss: 1.2789 grad: 1.46e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6264 data: 0.0867 lr: 2.51e-05 mem: 47% pow: 640.009 W 0: INFO 26-04-29 22:46:18.304551 - 7:10:59 - step: 33140 acc: 0 loss: 1.1687 grad: 1.52e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6077 data: 0.079 lr: 2.51e-05 mem: 47% pow: 661.839 W 0: INFO 26-04-29 22:46:31.822383 - 7:11:12 - step: 33150 acc: 0 loss: 1.1513 grad: 1.54e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6058 data: 0.0761 lr: 2.51e-05 mem: 47% pow: 674.108 W 0: INFO 26-04-29 22:46:45.279105 - 7:11:26 - step: 33160 acc: 0 loss: 1.123 grad: 1.43e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5913 data: 0.0824 lr: 2.51e-05 mem: 47% pow: 666.781 W 0: INFO 26-04-29 22:46:58.872379 - 7:11:39 - step: 33170 acc: 0 loss: 1.5208 grad: 1.45e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6015 data: 0.089 lr: 2.50e-05 mem: 47% pow: 667.418 W 0: INFO 26-04-29 22:47:12.596218 - 7:11:53 - step: 33180 acc: 0 loss: 1.5463 grad: 1.44e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6273 data: 0.086 lr: 2.50e-05 mem: 47% pow: 651.906 W 0: INFO 26-04-29 22:47:26.177200 - 7:12:06 - step: 33190 acc: 0 loss: 1.4871 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6373 data: 0.0821 lr: 2.50e-05 mem: 47% pow: 636.318 W 0: INFO 26-04-29 22:47:39.881292 - 7:12:20 - step: 33200 acc: 0 loss: 1.5082 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6025 data: 0.0756 lr: 2.50e-05 mem: 47% pow: 661.203 W 0: INFO 26-04-29 22:47:56.616631 - 7:12:37 - step: 33210 acc: 0 loss: 1.1915 grad: 1.55e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.602 data: 0.0883 lr: 2.50e-05 mem: 54% pow: 661.303 W 0: INFO 26-04-29 22:48:10.331268 - 7:12:51 - step: 33220 acc: 0 loss: 1.3088 grad: 1.63e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6034 data: 0.0814 lr: 2.50e-05 mem: 47% pow: 662.396 W 0: INFO 26-04-29 22:48:23.874001 - 7:13:04 - step: 33230 acc: 0 loss: 1.4755 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6257 data: 0.0868 lr: 2.50e-05 mem: 47% pow: 645.257 W 0: INFO 26-04-29 22:48:37.820827 - 7:13:18 - step: 33240 acc: 0 loss: 1.4274 grad: 1.50e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.613 data: 0.0907 lr: 2.49e-05 mem: 47% pow: 642.494 W 0: INFO 26-04-29 22:48:51.448509 - 7:13:32 - step: 33250 acc: 0 loss: 1.6403 grad: 1.53e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6017 data: 0.0891 lr: 2.49e-05 mem: 47% pow: 675.979 W 0: INFO 26-04-29 22:49:05.080137 - 7:13:45 - step: 33260 acc: 0 loss: 1.4237 grad: 1.45e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5905 data: 0.0921 lr: 2.49e-05 mem: 47% pow: 668.801 W 0: INFO 26-04-29 22:49:18.580492 - 7:13:59 - step: 33270 acc: 0 loss: 1.1865 grad: 1.43e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.586 data: 0.0896 lr: 2.49e-05 mem: 47% pow: 670.529 W 0: INFO 26-04-29 22:49:32.431539 - 7:14:13 - step: 33280 acc: 0 loss: 1.1882 grad: 1.46e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6031 data: 0.0872 lr: 2.49e-05 mem: 47% pow: 663.779 W 0: INFO 26-04-29 22:49:46.688084 - 7:14:27 - step: 33290 acc: 0 loss: 1.4159 grad: 1.52e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.5964 data: 0.0845 lr: 2.49e-05 mem: 47% pow: 658.236 W 0: INFO 26-04-29 22:50:00.360039 - 7:14:41 - step: 33300 acc: 0 loss: 1.649 grad: 1.58e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6054 data: 0.0903 lr: 2.49e-05 mem: 47% pow: 646.645 W 0: INFO 26-04-29 22:50:17.024289 - 7:14:57 - step: 33310 acc: 0 loss: 1.6787 grad: 1.59e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.5877 data: 0.0884 lr: 2.48e-05 mem: 54% pow: 668.26 W 0: INFO 26-04-29 22:50:30.560046 - 7:15:11 - step: 33320 acc: 0 loss: 1.4054 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5759 data: 0.1013 lr: 2.48e-05 mem: 47% pow: 656.544 W 0: INFO 26-04-29 22:50:44.489008 - 7:15:25 - step: 33330 acc: 0 loss: 1.5357 grad: 1.53e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.6733 data: 0.076 lr: 2.48e-05 mem: 47% pow: 623.058 W 0: INFO 26-04-29 22:50:58.172198 - 7:15:38 - step: 33340 acc: 0 loss: 1.2519 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5994 data: 0.088 lr: 2.48e-05 mem: 47% pow: 666.044 W 0: INFO 26-04-29 22:51:12.123948 - 7:15:52 - step: 33350 acc: 0 loss: 1.4709 grad: 1.42e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6639 data: 0.0724 lr: 2.48e-05 mem: 47% pow: 653.453 W 0: INFO 26-04-29 22:51:25.680316 - 7:16:06 - step: 33360 acc: 0 loss: 1.4352 grad: 1.64e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6041 data: 0.0929 lr: 2.48e-05 mem: 47% pow: 652.362 W 0: INFO 26-04-29 22:51:39.384428 - 7:16:20 - step: 33370 acc: 0 loss: 1.2705 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.691 data: 0.0908 lr: 2.47e-05 mem: 47% pow: 604.734 W 0: INFO 26-04-29 22:51:52.929460 - 7:16:33 - step: 33380 acc: 0 loss: 1.7078 grad: 1.57e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.616 data: 0.0717 lr: 2.47e-05 mem: 47% pow: 663.369 W 0: INFO 26-04-29 22:52:06.554774 - 7:16:47 - step: 33390 acc: 0 loss: 1.651 grad: 1.46e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.604 data: 0.0685 lr: 2.47e-05 mem: 47% pow: 676.273 W 0: INFO 26-04-29 22:52:20.048167 - 7:17:00 - step: 33400 acc: 0 loss: 1.4429 grad: 1.58e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5865 data: 0.0934 lr: 2.47e-05 mem: 47% pow: 662.023 W 0: INFO 26-04-29 22:52:36.626113 - 7:17:17 - step: 33410 acc: 0 loss: 1.4436 grad: 1.56e-01 flops: 3.41e+14 wps: 3.95e+04 iter: 0.6117 data: 0.0936 lr: 2.47e-05 mem: 54% pow: 649.542 W 0: INFO 26-04-29 22:52:50.209417 - 7:17:31 - step: 33420 acc: 0 loss: 1.3942 grad: 1.55e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5983 data: 0.0906 lr: 2.47e-05 mem: 47% pow: 671.077 W 0: INFO 26-04-29 22:53:03.791306 - 7:17:44 - step: 33430 acc: 0 loss: 1.3514 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.612 data: 0.0691 lr: 2.47e-05 mem: 47% pow: 659.723 W 0: INFO 26-04-29 22:53:17.557287 - 7:17:58 - step: 33440 acc: 0 loss: 1.2358 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.594 data: 0.1148 lr: 2.46e-05 mem: 47% pow: 653.02 W 0: INFO 26-04-29 22:53:31.061907 - 7:18:11 - step: 33450 acc: 0 loss: 1.3649 grad: 1.55e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6629 data: 0.0894 lr: 2.46e-05 mem: 47% pow: 629.592 W 0: INFO 26-04-29 22:53:44.624706 - 7:18:25 - step: 33460 acc: 0 loss: 1.5358 grad: 1.55e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6081 data: 0.0777 lr: 2.46e-05 mem: 47% pow: 668.944 W 0: INFO 26-04-29 22:53:58.261371 - 7:18:39 - step: 33470 acc: 0 loss: 1.4297 grad: 1.50e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5939 data: 0.0845 lr: 2.46e-05 mem: 47% pow: 656.772 W 0: INFO 26-04-29 22:54:11.931987 - 7:18:52 - step: 33480 acc: 0 loss: 1.2326 grad: 1.47e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5813 data: 0.1068 lr: 2.46e-05 mem: 47% pow: 665.811 W 0: INFO 26-04-29 22:54:25.748795 - 7:19:06 - step: 33490 acc: 0 loss: 1.6656 grad: 1.44e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6451 data: 0.0713 lr: 2.46e-05 mem: 47% pow: 639.568 W 0: INFO 26-04-29 22:54:39.707884 - 7:19:20 - step: 33500 acc: 0 loss: 1.5247 grad: 1.49e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6051 data: 0.0781 lr: 2.46e-05 mem: 47% pow: 650.547 W 0: INFO 26-04-29 22:54:56.061289 - 7:19:36 - step: 33510 acc: 0 loss: 1.2382 grad: 1.47e-01 flops: 3.46e+14 wps: 4.01e+04 iter: 0.6088 data: 0.0783 lr: 2.45e-05 mem: 54% pow: 662.175 W 0: INFO 26-04-29 22:55:09.596503 - 7:19:50 - step: 33520 acc: 0 loss: 1.1681 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5969 data: 0.0904 lr: 2.45e-05 mem: 47% pow: 665.752 W 0: INFO 26-04-29 22:55:23.372500 - 7:20:04 - step: 33530 acc: 0 loss: 1.289 grad: 1.54e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6067 data: 0.0863 lr: 2.45e-05 mem: 47% pow: 658.571 W 0: INFO 26-04-29 22:55:36.925743 - 7:20:17 - step: 33540 acc: 0 loss: 1.3678 grad: 1.49e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6121 data: 0.0877 lr: 2.45e-05 mem: 47% pow: 647.077 W 0: INFO 26-04-29 22:55:50.650834 - 7:20:31 - step: 33550 acc: 0 loss: 1.4398 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6128 data: 0.0705 lr: 2.45e-05 mem: 47% pow: 666.453 W 0: INFO 26-04-29 22:56:04.295337 - 7:20:45 - step: 33560 acc: 0 loss: 1.328 grad: 1.48e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5859 data: 0.0868 lr: 2.45e-05 mem: 47% pow: 671.99 W 0: INFO 26-04-29 22:56:18.042612 - 7:20:58 - step: 33570 acc: 0 loss: 1.3995 grad: 1.54e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5975 data: 0.0881 lr: 2.44e-05 mem: 47% pow: 665.577 W 0: INFO 26-04-29 22:56:31.791858 - 7:21:12 - step: 33580 acc: 0 loss: 1.3669 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.58 data: 0.0877 lr: 2.44e-05 mem: 47% pow: 676.167 W 0: INFO 26-04-29 22:56:45.493242 - 7:21:26 - step: 33590 acc: 0 loss: 1.3983 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6045 data: 0.0864 lr: 2.44e-05 mem: 47% pow: 655.647 W 0: INFO 26-04-29 22:56:59.226281 - 7:21:40 - step: 33600 acc: 0 loss: 1.3949 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7149 data: 0.0846 lr: 2.44e-05 mem: 47% pow: 595.948 W 0: INFO 26-04-29 22:57:15.896428 - 7:21:56 - step: 33610 acc: 0 loss: 1.4389 grad: 1.51e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6089 data: 0.089 lr: 2.44e-05 mem: 54% pow: 651.337 W 0: INFO 26-04-29 22:57:29.612965 - 7:22:10 - step: 33620 acc: 0 loss: 1.249 grad: 1.43e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6134 data: 0.0784 lr: 2.44e-05 mem: 47% pow: 658.498 W 0: INFO 26-04-29 22:57:42.962156 - 7:22:23 - step: 33630 acc: 0 loss: 1.3541 grad: 1.51e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.5811 data: 0.0922 lr: 2.44e-05 mem: 47% pow: 662.449 W 0: INFO 26-04-29 22:57:56.480247 - 7:22:37 - step: 33640 acc: 0 loss: 1.3947 grad: 1.61e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5952 data: 0.0786 lr: 2.43e-05 mem: 47% pow: 659.563 W 0: INFO 26-04-29 22:58:10.302197 - 7:22:51 - step: 33650 acc: 0 loss: 1.1342 grad: 1.46e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6053 data: 0.0759 lr: 2.43e-05 mem: 47% pow: 662.337 W 0: INFO 26-04-29 22:58:23.905441 - 7:23:04 - step: 33660 acc: 0 loss: 1.0977 grad: 1.47e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5914 data: 0.085 lr: 2.43e-05 mem: 47% pow: 661.935 W 0: INFO 26-04-29 22:58:37.475399 - 7:23:18 - step: 33670 acc: 0 loss: 1.3087 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6418 data: 0.0866 lr: 2.43e-05 mem: 47% pow: 638.065 W 0: INFO 26-04-29 22:58:51.702490 - 7:23:32 - step: 33680 acc: 0 loss: 1.2007 grad: 1.46e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.585 data: 0.094 lr: 2.43e-05 mem: 47% pow: 662.877 W 0: INFO 26-04-29 22:59:05.172644 - 7:23:45 - step: 33690 acc: 0 loss: 1.5624 grad: 1.53e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6266 data: 0.0575 lr: 2.43e-05 mem: 47% pow: 678.59 W 0: INFO 26-04-29 22:59:18.766605 - 7:23:59 - step: 33700 acc: 0 loss: 1.3282 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6661 data: 0.0976 lr: 2.43e-05 mem: 47% pow: 613.24 W 0: INFO 26-04-29 22:59:35.562236 - 7:24:16 - step: 33710 acc: 0 loss: 1.4545 grad: 1.46e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.5872 data: 0.094 lr: 2.42e-05 mem: 54% pow: 661.741 W 0: INFO 26-04-29 22:59:49.110110 - 7:24:29 - step: 33720 acc: 0 loss: 1.3889 grad: 1.54e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.583 data: 0.098 lr: 2.42e-05 mem: 47% pow: 675.096 W 0: INFO 26-04-29 23:00:02.949062 - 7:24:43 - step: 33730 acc: 0 loss: 1.71 grad: 1.58e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5824 data: 0.1226 lr: 2.42e-05 mem: 47% pow: 656.32 W 0: INFO 26-04-29 23:00:16.698421 - 7:24:57 - step: 33740 acc: 0 loss: 1.4244 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6228 data: 0.0904 lr: 2.42e-05 mem: 47% pow: 640.465 W 0: INFO 26-04-29 23:00:30.536415 - 7:25:11 - step: 33750 acc: 0 loss: 1.1277 grad: 1.50e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5954 data: 0.09 lr: 2.42e-05 mem: 47% pow: 669.259 W 0: INFO 26-04-29 23:00:44.168098 - 7:25:24 - step: 33760 acc: 0 loss: 1.2178 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5935 data: 0.0892 lr: 2.42e-05 mem: 47% pow: 663.599 W 0: INFO 26-04-29 23:00:57.871174 - 7:25:38 - step: 33770 acc: 0 loss: 1.6581 grad: 1.46e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5837 data: 0.086 lr: 2.42e-05 mem: 47% pow: 679.751 W 0: INFO 26-04-29 23:01:11.527213 - 7:25:52 - step: 33780 acc: 0 loss: 1.6192 grad: 1.57e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6096 data: 0.0914 lr: 2.41e-05 mem: 47% pow: 638.162 W 0: INFO 26-04-29 23:01:25.292058 - 7:26:06 - step: 33790 acc: 0 loss: 1.3837 grad: 1.48e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6114 data: 0.0897 lr: 2.41e-05 mem: 47% pow: 648.741 W 0: INFO 26-04-29 23:01:38.974006 - 7:26:19 - step: 33800 acc: 0 loss: 1.4026 grad: 1.56e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6263 data: 0.0659 lr: 2.41e-05 mem: 47% pow: 656.919 W 0: INFO 26-04-29 23:01:55.621650 - 7:26:36 - step: 33810 acc: 0 loss: 1.6941 grad: 1.52e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.5844 data: 0.0867 lr: 2.41e-05 mem: 54% pow: 671.886 W 0: INFO 26-04-29 23:02:09.180026 - 7:26:49 - step: 33820 acc: 0 loss: 1.2946 grad: 1.56e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5925 data: 0.0801 lr: 2.41e-05 mem: 47% pow: 668.742 W 0: INFO 26-04-29 23:02:22.996541 - 7:27:03 - step: 33830 acc: 0 loss: 1.1565 grad: 1.49e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6104 data: 0.0805 lr: 2.41e-05 mem: 47% pow: 667.95 W 0: INFO 26-04-29 23:02:36.468169 - 7:27:17 - step: 33840 acc: 0 loss: 1.4796 grad: 1.49e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5863 data: 0.0905 lr: 2.40e-05 mem: 47% pow: 658.359 W 0: INFO 26-04-29 23:02:50.207895 - 7:27:31 - step: 33850 acc: 0 loss: 1.2628 grad: 1.70e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6199 data: 0.0598 lr: 2.40e-05 mem: 47% pow: 658.477 W 0: INFO 26-04-29 23:03:03.953522 - 7:27:44 - step: 33860 acc: 0 loss: 1.4149 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6516 data: 0.0799 lr: 2.40e-05 mem: 47% pow: 639.662 W 0: INFO 26-04-29 23:03:17.705887 - 7:27:58 - step: 33870 acc: 0 loss: 1.5984 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5914 data: 0.0901 lr: 2.40e-05 mem: 47% pow: 662.245 W 0: INFO 26-04-29 23:03:31.535251 - 7:28:12 - step: 33880 acc: 0 loss: 1.3839 grad: 1.51e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5975 data: 0.0839 lr: 2.40e-05 mem: 47% pow: 678.916 W 0: INFO 26-04-29 23:03:45.495763 - 7:28:26 - step: 33890 acc: 0 loss: 1.6051 grad: 1.57e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5874 data: 0.0853 lr: 2.40e-05 mem: 47% pow: 664.586 W 0: INFO 26-04-29 23:03:59.142415 - 7:28:39 - step: 33900 acc: 0 loss: 1.246 grad: 1.63e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5794 data: 0.232 lr: 2.40e-05 mem: 47% pow: 591.518 W 0: INFO 26-04-29 23:04:15.651663 - 7:28:56 - step: 33910 acc: 0 loss: 1.289 grad: 1.46e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6473 data: 0.0747 lr: 2.39e-05 mem: 54% pow: 635.829 W 0: INFO 26-04-29 23:04:29.157608 - 7:29:09 - step: 33920 acc: 0 loss: 1.1842 grad: 1.59e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6089 data: 0.0837 lr: 2.39e-05 mem: 47% pow: 659.874 W 0: INFO 26-04-29 23:04:42.824476 - 7:29:23 - step: 33930 acc: 0 loss: 1.3247 grad: 1.52e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6089 data: 0.0884 lr: 2.39e-05 mem: 47% pow: 646.366 W 0: INFO 26-04-29 23:04:56.669532 - 7:29:37 - step: 33940 acc: 0 loss: 1.5535 grad: 1.55e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6329 data: 0.0864 lr: 2.39e-05 mem: 47% pow: 639.43 W 0: INFO 26-04-29 23:05:10.407360 - 7:29:51 - step: 33950 acc: 0 loss: 1.6595 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5948 data: 0.09 lr: 2.39e-05 mem: 47% pow: 657.428 W 0: INFO 26-04-29 23:05:24.573978 - 7:30:05 - step: 33960 acc: 0 loss: 1.2789 grad: 1.54e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6664 data: 0.1022 lr: 2.39e-05 mem: 47% pow: 619.91 W 0: INFO 26-04-29 23:05:38.149456 - 7:30:18 - step: 33970 acc: 0 loss: 1.2587 grad: 1.61e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6013 data: 0.0805 lr: 2.39e-05 mem: 47% pow: 663.002 W 0: INFO 26-04-29 23:05:51.843246 - 7:30:32 - step: 33980 acc: 0 loss: 1.0301 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5892 data: 0.0868 lr: 2.38e-05 mem: 47% pow: 662.415 W 0: INFO 26-04-29 23:06:05.493768 - 7:30:46 - step: 33990 acc: 0 loss: 1.227 grad: 1.73e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5957 data: 0.091 lr: 2.38e-05 mem: 47% pow: 674.47 W 0: INFO 26-04-29 23:06:19.059501 - 7:30:59 - step: 34000 acc: 0 loss: 1.304 grad: 1.53e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5878 data: 0.0862 lr: 2.38e-05 mem: 47% pow: 682.46 W 0: INFO 26-04-29 23:06:22.705217 - 7:31:03 - garbage collection 0: INFO 26-04-29 23:06:37.264772 - 7:31:18 - step: 34010 acc: 0 loss: 1.2445 grad: 1.56e-01 flops: 3.10e+14 wps: 3.60e+04 iter: 0.764 data: 0.0856 lr: 2.38e-05 mem: 54% pow: 571.834 W 0: INFO 26-04-29 23:06:50.991478 - 7:31:31 - step: 34020 acc: 0 loss: 1.5226 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5979 data: 0.082 lr: 2.38e-05 mem: 47% pow: 658.681 W 0: INFO 26-04-29 23:07:05.115102 - 7:31:45 - step: 34030 acc: 0 loss: 1.5561 grad: 1.56e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5861 data: 0.0815 lr: 2.38e-05 mem: 47% pow: 672.866 W 0: INFO 26-04-29 23:07:19.065005 - 7:31:59 - step: 34040 acc: 0 loss: 1.4152 grad: 1.40e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6733 data: 0.0034 lr: 2.37e-05 mem: 47% pow: 660.781 W 0: INFO 26-04-29 23:07:32.709180 - 7:32:13 - step: 34050 acc: 0 loss: 1.4193 grad: 1.49e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6193 data: 0.0857 lr: 2.37e-05 mem: 47% pow: 646.946 W 0: INFO 26-04-29 23:07:46.856945 - 7:32:27 - step: 34060 acc: 0 loss: 1.4746 grad: 1.56e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6221 data: 0.0879 lr: 2.37e-05 mem: 47% pow: 640.424 W 0: INFO 26-04-29 23:08:00.979287 - 7:32:41 - step: 34070 acc: 0 loss: 1.2749 grad: 1.57e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6234 data: 0.0869 lr: 2.37e-05 mem: 47% pow: 654.091 W 0: INFO 26-04-29 23:08:15.937808 - 7:32:56 - step: 34080 acc: 0 loss: 1.6214 grad: 1.45e-01 flops: 3.78e+14 wps: 4.38e+04 iter: 0.6887 data: 0.0844 lr: 2.37e-05 mem: 47% pow: 604.473 W 0: INFO 26-04-29 23:08:29.898755 - 7:33:10 - step: 34090 acc: 0 loss: 1.3235 grad: 1.60e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.587 data: 0.0887 lr: 2.37e-05 mem: 47% pow: 658.676 W 0: INFO 26-04-29 23:08:44.186360 - 7:33:24 - step: 34100 acc: 0 loss: 1.533 grad: 1.53e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.7282 data: 0.0709 lr: 2.37e-05 mem: 47% pow: 594.684 W 0: INFO 26-04-29 23:09:01.132543 - 7:33:41 - step: 34110 acc: 0 loss: 1.3348 grad: 1.57e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.609 data: 0.0914 lr: 2.36e-05 mem: 54% pow: 647.572 W 0: INFO 26-04-29 23:09:15.201699 - 7:33:55 - step: 34120 acc: 0 loss: 1.5215 grad: 1.53e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.8269 data: 0.0852 lr: 2.36e-05 mem: 47% pow: 534.267 W 0: INFO 26-04-29 23:09:29.137585 - 7:34:09 - step: 34130 acc: 0 loss: 1.436 grad: 1.53e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6045 data: 0.0876 lr: 2.36e-05 mem: 47% pow: 658.068 W 0: INFO 26-04-29 23:09:43.118539 - 7:34:23 - step: 34140 acc: 0 loss: 1.3331 grad: 1.51e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5795 data: 0.0968 lr: 2.36e-05 mem: 47% pow: 662.404 W 0: INFO 26-04-29 23:09:57.134992 - 7:34:37 - step: 34150 acc: 0 loss: 1.5717 grad: 1.44e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6345 data: 0.087 lr: 2.36e-05 mem: 47% pow: 635.821 W 0: INFO 26-04-29 23:10:11.175293 - 7:34:51 - step: 34160 acc: 0 loss: 1.2854 grad: 1.51e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.5861 data: 0.0866 lr: 2.36e-05 mem: 47% pow: 677.983 W 0: INFO 26-04-29 23:10:25.181647 - 7:35:05 - step: 34170 acc: 0 loss: 1.1984 grad: 1.53e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6588 data: 0.0811 lr: 2.36e-05 mem: 47% pow: 644.787 W 0: INFO 26-04-29 23:10:38.917903 - 7:35:19 - step: 34180 acc: 0 loss: 1.3985 grad: 1.50e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6414 data: 0.0893 lr: 2.35e-05 mem: 47% pow: 638.997 W 0: INFO 26-04-29 23:10:52.957982 - 7:35:33 - step: 34190 acc: 0 loss: 1.239 grad: 1.57e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6188 data: 0.0825 lr: 2.35e-05 mem: 47% pow: 656.045 W 0: INFO 26-04-29 23:11:06.851611 - 7:35:47 - step: 34200 acc: 0 loss: 1.2088 grad: 1.51e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5886 data: 0.1182 lr: 2.35e-05 mem: 47% pow: 651.196 W 0: INFO 26-04-29 23:11:23.290042 - 7:36:04 - step: 34210 acc: 0 loss: 1.2556 grad: 1.56e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.6313 data: 0.0877 lr: 2.35e-05 mem: 54% pow: 645.298 W 0: INFO 26-04-29 23:11:37.595341 - 7:36:18 - step: 34220 acc: 0 loss: 1.1813 grad: 1.63e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.5832 data: 0.11 lr: 2.35e-05 mem: 47% pow: 658.391 W 0: INFO 26-04-29 23:11:51.296516 - 7:36:32 - step: 34230 acc: 0 loss: 1.1496 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5886 data: 0.0857 lr: 2.35e-05 mem: 47% pow: 671.995 W 0: INFO 26-04-29 23:12:04.949618 - 7:36:45 - step: 34240 acc: 0 loss: 1.4209 grad: 1.52e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5904 data: 0.0902 lr: 2.35e-05 mem: 47% pow: 664.254 W 0: INFO 26-04-29 23:12:18.872509 - 7:36:59 - step: 34250 acc: 0 loss: 1.2369 grad: 1.50e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6332 data: 0.0913 lr: 2.34e-05 mem: 47% pow: 637.122 W 0: INFO 26-04-29 23:12:32.739380 - 7:37:13 - step: 34260 acc: 0 loss: 1.505 grad: 1.43e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6756 data: 0.0748 lr: 2.34e-05 mem: 47% pow: 621.348 W 0: INFO 26-04-29 23:12:46.574837 - 7:37:27 - step: 34270 acc: 0 loss: 1.2619 grad: 1.46e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7089 data: 0.0833 lr: 2.34e-05 mem: 47% pow: 601.481 W 0: INFO 26-04-29 23:13:00.361766 - 7:37:41 - step: 34280 acc: 0 loss: 1.4091 grad: 1.56e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6016 data: 0.0885 lr: 2.34e-05 mem: 47% pow: 665.457 W 0: INFO 26-04-29 23:13:14.562217 - 7:37:55 - step: 34290 acc: 0 loss: 1.467 grad: 1.48e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6187 data: 0.0776 lr: 2.34e-05 mem: 47% pow: 647.554 W 0: INFO 26-04-29 23:13:28.596687 - 7:38:09 - step: 34300 acc: 0 loss: 1.1863 grad: 1.64e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6989 data: 0.0666 lr: 2.34e-05 mem: 47% pow: 616.8 W 0: INFO 26-04-29 23:13:45.917727 - 7:38:26 - step: 34310 acc: 0 loss: 1.5059 grad: 1.55e-01 flops: 3.26e+14 wps: 3.79e+04 iter: 0.6962 data: 0.0739 lr: 2.33e-05 mem: 54% pow: 614.884 W 0: INFO 26-04-29 23:13:59.550339 - 7:38:40 - step: 34320 acc: 0 loss: 1.133 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5782 data: 0.1222 lr: 2.33e-05 mem: 47% pow: 654.674 W 0: INFO 26-04-29 23:14:13.360082 - 7:38:54 - step: 34330 acc: 0 loss: 1.3917 grad: 1.56e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6419 data: 0.0881 lr: 2.33e-05 mem: 47% pow: 639.303 W 0: INFO 26-04-29 23:14:27.631323 - 7:39:08 - step: 34340 acc: 0 loss: 1.8445 grad: 1.51e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.6163 data: 0.0914 lr: 2.33e-05 mem: 47% pow: 647.385 W 0: INFO 26-04-29 23:14:41.499570 - 7:39:22 - step: 34350 acc: 0 loss: 1.4966 grad: 1.55e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5957 data: 0.0944 lr: 2.33e-05 mem: 47% pow: 673.537 W 0: INFO 26-04-29 23:14:55.637929 - 7:39:36 - step: 34360 acc: 0 loss: 1.5187 grad: 1.53e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6097 data: 0.0834 lr: 2.33e-05 mem: 47% pow: 663.061 W 0: INFO 26-04-29 23:15:09.129547 - 7:39:49 - step: 34370 acc: 0 loss: 1.5837 grad: 1.52e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6228 data: 0.0782 lr: 2.33e-05 mem: 47% pow: 654.48 W 0: INFO 26-04-29 23:15:23.442985 - 7:40:04 - step: 34380 acc: 0 loss: 1.131 grad: 1.47e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6121 data: 0.0847 lr: 2.32e-05 mem: 47% pow: 651.933 W 0: INFO 26-04-29 23:15:37.373996 - 7:40:18 - step: 34390 acc: 0 loss: 1.2172 grad: 1.47e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5916 data: 0.0902 lr: 2.32e-05 mem: 47% pow: 663.397 W 0: INFO 26-04-29 23:15:51.265670 - 7:40:32 - step: 34400 acc: 0 loss: 1.667 grad: 1.57e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5938 data: 0.0882 lr: 2.32e-05 mem: 47% pow: 664.301 W 0: INFO 26-04-29 23:16:08.094003 - 7:40:48 - step: 34410 acc: 0 loss: 1.4358 grad: 1.50e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.5865 data: 0.0938 lr: 2.32e-05 mem: 54% pow: 662.227 W 0: INFO 26-04-29 23:16:22.155024 - 7:41:02 - step: 34420 acc: 0 loss: 1.1686 grad: 1.48e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6127 data: 0.0862 lr: 2.32e-05 mem: 47% pow: 648.674 W 0: INFO 26-04-29 23:16:36.185439 - 7:41:16 - step: 34430 acc: 0 loss: 1.5367 grad: 1.47e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6487 data: 0.0881 lr: 2.32e-05 mem: 47% pow: 624.138 W 0: INFO 26-04-29 23:16:49.934772 - 7:41:30 - step: 34440 acc: 0 loss: 1.2595 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7171 data: 0.0899 lr: 2.32e-05 mem: 47% pow: 601.447 W 0: INFO 26-04-29 23:17:04.088416 - 7:41:44 - step: 34450 acc: 0 loss: 1.529 grad: 1.52e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6225 data: 0.063 lr: 2.31e-05 mem: 47% pow: 660.248 W 0: INFO 26-04-29 23:17:18.096216 - 7:41:58 - step: 34460 acc: 0 loss: 1.5016 grad: 1.51e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6391 data: 0.0477 lr: 2.31e-05 mem: 47% pow: 661.246 W 0: INFO 26-04-29 23:17:31.817710 - 7:42:12 - step: 34470 acc: 0 loss: 1.5633 grad: 1.51e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6087 data: 0.0807 lr: 2.31e-05 mem: 47% pow: 658.503 W 0: INFO 26-04-29 23:17:45.334705 - 7:42:26 - step: 34480 acc: 0 loss: 1.6195 grad: 1.47e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6193 data: 0.0863 lr: 2.31e-05 mem: 47% pow: 654.533 W 0: INFO 26-04-29 23:17:59.313155 - 7:42:40 - step: 34490 acc: 0 loss: 1.7493 grad: 1.57e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5799 data: 0.087 lr: 2.31e-05 mem: 47% pow: 673.944 W 0: INFO 26-04-29 23:18:13.136119 - 7:42:53 - step: 34500 acc: 0 loss: 1.2372 grad: 1.48e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6017 data: 0.087 lr: 2.31e-05 mem: 47% pow: 661.332 W 0: INFO 26-04-29 23:18:29.627651 - 7:43:10 - step: 34510 acc: 0 loss: 1.0093 grad: 1.47e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5903 data: 0.0906 lr: 2.31e-05 mem: 54% pow: 657.894 W 0: INFO 26-04-29 23:18:43.737290 - 7:43:24 - step: 34520 acc: 0 loss: 1.3815 grad: 1.59e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6122 data: 0.0835 lr: 2.30e-05 mem: 47% pow: 652.036 W 0: INFO 26-04-29 23:18:57.729677 - 7:43:38 - step: 34530 acc: 0 loss: 1.6731 grad: 1.62e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5847 data: 0.0974 lr: 2.30e-05 mem: 47% pow: 662.169 W 0: INFO 26-04-29 23:19:11.486701 - 7:43:52 - step: 34540 acc: 0 loss: 1.4126 grad: 1.54e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5912 data: 0.0853 lr: 2.30e-05 mem: 47% pow: 657.04 W 0: INFO 26-04-29 23:19:25.680118 - 7:44:06 - step: 34550 acc: 0 loss: 1.654 grad: 1.53e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6019 data: 0.0843 lr: 2.30e-05 mem: 47% pow: 659.504 W 0: INFO 26-04-29 23:19:39.445086 - 7:44:20 - step: 34560 acc: 0 loss: 1.5491 grad: 1.50e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6087 data: 0.0802 lr: 2.30e-05 mem: 47% pow: 679.358 W 0: INFO 26-04-29 23:19:53.221012 - 7:44:34 - step: 34570 acc: 0 loss: 1.3674 grad: 1.65e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6328 data: 0.0815 lr: 2.30e-05 mem: 47% pow: 636.165 W 0: INFO 26-04-29 23:20:06.849116 - 7:44:47 - step: 34580 acc: 0 loss: 1.3764 grad: 1.47e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5979 data: 0.087 lr: 2.29e-05 mem: 47% pow: 666.067 W 0: INFO 26-04-29 23:20:20.633530 - 7:45:01 - step: 34590 acc: 0 loss: 1.6116 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5969 data: 0.0865 lr: 2.29e-05 mem: 47% pow: 670.891 W 0: INFO 26-04-29 23:20:34.336153 - 7:45:15 - step: 34600 acc: 0 loss: 1.2343 grad: 1.49e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5972 data: 0.0847 lr: 2.29e-05 mem: 47% pow: 660.606 W 0: INFO 26-04-29 23:20:50.853388 - 7:45:31 - step: 34610 acc: 0 loss: 1.2613 grad: 1.47e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.588 data: 0.0897 lr: 2.29e-05 mem: 54% pow: 659.936 W 0: INFO 26-04-29 23:21:04.352280 - 7:45:45 - step: 34620 acc: 0 loss: 1.4639 grad: 1.51e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.58 data: 0.097 lr: 2.29e-05 mem: 47% pow: 659.704 W 0: INFO 26-04-29 23:21:17.873665 - 7:45:58 - step: 34630 acc: 0 loss: 1.5192 grad: 1.52e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5823 data: 0.088 lr: 2.29e-05 mem: 47% pow: 665.446 W 0: INFO 26-04-29 23:21:31.377535 - 7:46:12 - step: 34640 acc: 0 loss: 1.384 grad: 1.61e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5823 data: 0.0915 lr: 2.29e-05 mem: 47% pow: 669.212 W 0: INFO 26-04-29 23:21:45.255932 - 7:46:26 - step: 34650 acc: 0 loss: 1.3165 grad: 1.47e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.8227 data: 0.0901 lr: 2.28e-05 mem: 47% pow: 530.632 W 0: INFO 26-04-29 23:21:59.067877 - 7:46:39 - step: 34660 acc: 0 loss: 1.0463 grad: 1.48e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5876 data: 0.088 lr: 2.28e-05 mem: 47% pow: 667.245 W 0: INFO 26-04-29 23:22:12.880434 - 7:46:53 - step: 34670 acc: 0 loss: 1.211 grad: 1.44e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5941 data: 0.0843 lr: 2.28e-05 mem: 47% pow: 664.8 W 0: INFO 26-04-29 23:22:26.582125 - 7:47:07 - step: 34680 acc: 0 loss: 1.7121 grad: 1.48e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6262 data: 0.0655 lr: 2.28e-05 mem: 47% pow: 657.409 W 0: INFO 26-04-29 23:22:40.422445 - 7:47:21 - step: 34690 acc: 0 loss: 1.4381 grad: 1.50e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6409 data: 0.0851 lr: 2.28e-05 mem: 47% pow: 647.558 W 0: INFO 26-04-29 23:22:54.196554 - 7:47:34 - step: 34700 acc: 0 loss: 1.7511 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6236 data: 0.0857 lr: 2.28e-05 mem: 47% pow: 646.977 W 0: INFO 26-04-29 23:23:10.885460 - 7:47:51 - step: 34710 acc: 0 loss: 1.333 grad: 1.52e-01 flops: 3.38e+14 wps: 3.93e+04 iter: 0.6038 data: 0.093 lr: 2.28e-05 mem: 54% pow: 655.098 W 0: INFO 26-04-29 23:23:24.434439 - 7:48:05 - step: 34720 acc: 0 loss: 1.7075 grad: 1.61e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6348 data: 0.0549 lr: 2.27e-05 mem: 47% pow: 655.373 W 0: INFO 26-04-29 23:23:38.312764 - 7:48:19 - step: 34730 acc: 0 loss: 1.3885 grad: 1.44e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.62 data: 0.0797 lr: 2.27e-05 mem: 47% pow: 671.196 W 0: INFO 26-04-29 23:23:51.877505 - 7:48:32 - step: 34740 acc: 0 loss: 1.5589 grad: 1.47e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.604 data: 0.0881 lr: 2.27e-05 mem: 47% pow: 652.474 W 0: INFO 26-04-29 23:24:05.693794 - 7:48:46 - step: 34750 acc: 0 loss: 1.6343 grad: 1.50e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5953 data: 0.0886 lr: 2.27e-05 mem: 47% pow: 666.915 W 0: INFO 26-04-29 23:24:19.580029 - 7:49:00 - step: 34760 acc: 0 loss: 1.6175 grad: 1.57e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5871 data: 0.0915 lr: 2.27e-05 mem: 47% pow: 670.609 W 0: INFO 26-04-29 23:24:33.158349 - 7:49:13 - step: 34770 acc: 0 loss: 1.732 grad: 1.46e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6532 data: 0.0921 lr: 2.27e-05 mem: 47% pow: 628.936 W 0: INFO 26-04-29 23:24:46.854869 - 7:49:27 - step: 34780 acc: 0 loss: 1.8436 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6707 data: 0.1321 lr: 2.26e-05 mem: 47% pow: 589.398 W 0: INFO 26-04-29 23:25:00.510281 - 7:49:41 - step: 34790 acc: 0 loss: 1.5214 grad: 1.48e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6082 data: 0.098 lr: 2.26e-05 mem: 47% pow: 650.001 W 0: INFO 26-04-29 23:25:14.219332 - 7:49:55 - step: 34800 acc: 0 loss: 1.4846 grad: 1.63e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5801 data: 0.1081 lr: 2.26e-05 mem: 47% pow: 654.899 W 0: INFO 26-04-29 23:25:30.903527 - 7:50:11 - step: 34810 acc: 0 loss: 1.5792 grad: 1.50e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6074 data: 0.0907 lr: 2.26e-05 mem: 54% pow: 643.944 W 0: INFO 26-04-29 23:25:44.571341 - 7:50:25 - step: 34820 acc: 0 loss: 1.337 grad: 1.48e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5866 data: 0.0951 lr: 2.26e-05 mem: 47% pow: 667.967 W 0: INFO 26-04-29 23:25:58.438332 - 7:50:39 - step: 34830 acc: 0 loss: 1.4651 grad: 1.49e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.7278 data: 0.0875 lr: 2.26e-05 mem: 47% pow: 582.043 W 0: INFO 26-04-29 23:26:12.031002 - 7:50:52 - step: 34840 acc: 0 loss: 1.4014 grad: 1.54e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5861 data: 0.0956 lr: 2.26e-05 mem: 47% pow: 668.887 W 0: INFO 26-04-29 23:26:25.775003 - 7:51:06 - step: 34850 acc: 0 loss: 1.2892 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6101 data: 0.0804 lr: 2.25e-05 mem: 47% pow: 659.759 W 0: INFO 26-04-29 23:26:39.422149 - 7:51:20 - step: 34860 acc: 0 loss: 1.2725 grad: 1.54e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5833 data: 0.0894 lr: 2.25e-05 mem: 47% pow: 675.679 W 0: INFO 26-04-29 23:26:53.243283 - 7:51:34 - step: 34870 acc: 0 loss: 1.6129 grad: 1.51e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6808 data: 0.0698 lr: 2.25e-05 mem: 47% pow: 617.742 W 0: INFO 26-04-29 23:27:07.036000 - 7:51:47 - step: 34880 acc: 0 loss: 1.8691 grad: 1.60e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6452 data: 0.0841 lr: 2.25e-05 mem: 47% pow: 637.949 W 0: INFO 26-04-29 23:27:20.835955 - 7:52:01 - step: 34890 acc: 0 loss: 1.3824 grad: 1.57e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.631 data: 0.084 lr: 2.25e-05 mem: 47% pow: 642.509 W 0: INFO 26-04-29 23:27:34.532764 - 7:52:15 - step: 34900 acc: 0 loss: 1.3473 grad: 1.51e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6107 data: 0.0789 lr: 2.25e-05 mem: 47% pow: 663.689 W 0: INFO 26-04-29 23:27:50.936483 - 7:52:31 - step: 34910 acc: 0 loss: 1.218 grad: 1.51e-01 flops: 3.44e+14 wps: 4.00e+04 iter: 0.6341 data: 0.0928 lr: 2.25e-05 mem: 54% pow: 634.635 W 0: INFO 26-04-29 23:28:04.774483 - 7:52:45 - step: 34920 acc: 0 loss: 1.5057 grad: 1.53e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6668 data: 0.0638 lr: 2.24e-05 mem: 47% pow: 646.79 W 0: INFO 26-04-29 23:28:18.547331 - 7:52:59 - step: 34930 acc: 0 loss: 1.4379 grad: 1.40e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.604 data: 0.0901 lr: 2.24e-05 mem: 47% pow: 667.026 W 0: INFO 26-04-29 23:28:32.059597 - 7:53:12 - step: 34940 acc: 0 loss: 1.488 grad: 1.47e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5915 data: 0.0845 lr: 2.24e-05 mem: 47% pow: 666.985 W 0: INFO 26-04-29 23:28:45.606438 - 7:53:26 - step: 34950 acc: 0 loss: 1.4996 grad: 1.44e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6198 data: 0.093 lr: 2.24e-05 mem: 47% pow: 643.437 W 0: INFO 26-04-29 23:28:59.256404 - 7:53:40 - step: 34960 acc: 0 loss: 1.191 grad: 1.43e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5816 data: 0.1393 lr: 2.24e-05 mem: 47% pow: 628.905 W 0: INFO 26-04-29 23:29:12.951681 - 7:53:53 - step: 34970 acc: 0 loss: 1.9247 grad: 1.49e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5968 data: 0.091 lr: 2.24e-05 mem: 47% pow: 667.484 W 0: INFO 26-04-29 23:29:26.680101 - 7:54:07 - step: 34980 acc: 0 loss: 1.6636 grad: 1.51e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6061 data: 0.0832 lr: 2.24e-05 mem: 47% pow: 658.326 W 0: INFO 26-04-29 23:29:40.757082 - 7:54:21 - step: 34990 acc: 0 loss: 1.4432 grad: 1.50e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6228 data: 0.0906 lr: 2.23e-05 mem: 47% pow: 639.16 W 0: INFO 26-04-29 23:29:54.637396 - 7:54:35 - step: 35000 acc: 0 loss: 1.625 grad: 1.48e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5946 data: 0.0928 lr: 2.23e-05 mem: 47% pow: 674.983 W 0: INFO 26-04-29 23:29:54.642363 - 7:54:35 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000035000 0: INFO 26-04-29 23:29:54.643012 - 7:54:35 - Saving... 0: INFO 26-04-29 23:30:00.354210 - 7:54:41 - State dict saved! 0: INFO 26-04-29 23:30:00.432529 - 7:54:41 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000035000/train_state_00000.json 0: INFO 26-04-29 23:30:00.436386 - 7:54:41 - Train state saved ! 0: INFO 26-04-29 23:30:00.436592 - 7:54:41 - Cleaning up checkpoints... 0: INFO 26-04-29 23:30:00.436740 - 7:54:41 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000030000'), PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000035000')] 0: INFO 26-04-29 23:30:00.436864 - 7:54:41 - Eval folders: [] 0: INFO 26-04-29 23:30:00.437179 - 7:54:41 - Other folders: [] 0: INFO 26-04-29 23:30:00.437311 - 7:54:41 - Removing folders: {PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000030000')} 0: INFO 26-04-29 23:30:04.514470 - 7:54:45 - garbage collection 0: INFO 26-04-29 23:30:19.331298 - 7:55:00 - step: 35010 acc: 0 loss: 1.0836 grad: 1.47e-01 flops: 2.29e+14 wps: 2.65e+04 iter: 0.5954 data: 0.0918 lr: 2.23e-05 mem: 54% pow: 661.128 W 0: INFO 26-04-29 23:30:33.198385 - 7:55:13 - step: 35020 acc: 0 loss: 1.5775 grad: 1.55e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5969 data: 0.0919 lr: 2.23e-05 mem: 47% pow: 658.595 W 0: INFO 26-04-29 23:30:47.195519 - 7:55:27 - step: 35030 acc: 0 loss: 1.3461 grad: 1.52e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6532 data: 0.0974 lr: 2.23e-05 mem: 47% pow: 618.739 W 0: INFO 26-04-29 23:31:00.926371 - 7:55:41 - step: 35040 acc: 0 loss: 1.3299 grad: 1.58e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5838 data: 0.0878 lr: 2.23e-05 mem: 47% pow: 667.808 W 0: INFO 26-04-29 23:31:14.951839 - 7:55:55 - step: 35050 acc: 0 loss: 1.3436 grad: 1.45e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.5788 data: 0.1476 lr: 2.22e-05 mem: 47% pow: 640.528 W 0: INFO 26-04-29 23:31:29.064093 - 7:56:09 - step: 35060 acc: 0 loss: 1.2885 grad: 1.43e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6174 data: 0.0764 lr: 2.22e-05 mem: 47% pow: 669.455 W 0: INFO 26-04-29 23:31:43.541792 - 7:56:24 - step: 35070 acc: 0 loss: 1.3014 grad: 1.52e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.6467 data: 0.088 lr: 2.22e-05 mem: 47% pow: 622.481 W 0: INFO 26-04-29 23:31:57.509287 - 7:56:38 - step: 35080 acc: 0 loss: 1.5063 grad: 1.52e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6154 data: 0.0874 lr: 2.22e-05 mem: 47% pow: 656.564 W 0: INFO 26-04-29 23:32:11.565090 - 7:56:52 - step: 35090 acc: 0 loss: 1.3603 grad: 1.50e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6085 data: 0.0915 lr: 2.22e-05 mem: 47% pow: 650.984 W 0: INFO 26-04-29 23:32:25.942877 - 7:57:06 - step: 35100 acc: 0 loss: 1.3706 grad: 1.47e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6343 data: 0.0815 lr: 2.22e-05 mem: 47% pow: 641.437 W 0: INFO 26-04-29 23:32:43.279874 - 7:57:24 - step: 35110 acc: 0 loss: 1.533 grad: 1.56e-01 flops: 3.26e+14 wps: 3.78e+04 iter: 0.5975 data: 0.0831 lr: 2.22e-05 mem: 54% pow: 684.344 W 0: INFO 26-04-29 23:32:57.620621 - 7:57:38 - step: 35120 acc: 0 loss: 1.91 grad: 1.50e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.8631 data: 0.0925 lr: 2.21e-05 mem: 47% pow: 505.449 W 0: INFO 26-04-29 23:33:11.912281 - 7:57:52 - step: 35130 acc: 0 loss: 1.5926 grad: 1.52e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.7248 data: 0.0927 lr: 2.21e-05 mem: 47% pow: 584.026 W 0: INFO 26-04-29 23:33:26.685472 - 7:58:07 - step: 35140 acc: 0 loss: 1.2714 grad: 1.50e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.7634 data: 0.0781 lr: 2.21e-05 mem: 47% pow: 573.026 W 0: INFO 26-04-29 23:33:40.950910 - 7:58:21 - step: 35150 acc: 0 loss: 1.503 grad: 1.50e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6242 data: 0.0957 lr: 2.21e-05 mem: 47% pow: 631.727 W 0: INFO 26-04-29 23:33:55.322903 - 7:58:36 - step: 35160 acc: 0 loss: 1.2589 grad: 1.53e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.783 data: 0.0863 lr: 2.21e-05 mem: 47% pow: 555.776 W 0: INFO 26-04-29 23:34:09.568242 - 7:58:50 - step: 35170 acc: 0 loss: 1.3271 grad: 1.56e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.6058 data: 0.0914 lr: 2.21e-05 mem: 47% pow: 649.085 W 0: INFO 26-04-29 23:34:23.884670 - 7:59:04 - step: 35180 acc: 0 loss: 1.2711 grad: 1.47e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.5958 data: 0.0991 lr: 2.21e-05 mem: 47% pow: 655.023 W 0: INFO 26-04-29 23:34:37.961624 - 7:59:18 - step: 35190 acc: 0 loss: 1.5585 grad: 1.45e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6091 data: 0.0853 lr: 2.20e-05 mem: 47% pow: 666.038 W 0: INFO 26-04-29 23:34:52.592184 - 7:59:33 - step: 35200 acc: 0 loss: 1.4703 grad: 1.56e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.6024 data: 0.1009 lr: 2.20e-05 mem: 47% pow: 654.227 W 0: INFO 26-04-29 23:35:09.941125 - 7:59:50 - step: 35210 acc: 0 loss: 1.134 grad: 1.55e-01 flops: 3.26e+14 wps: 3.78e+04 iter: 0.6299 data: 0.0765 lr: 2.20e-05 mem: 54% pow: 669.613 W 0: INFO 26-04-29 23:35:24.472329 - 8:00:05 - step: 35220 acc: 0 loss: 1.2551 grad: 1.48e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.598 data: 0.087 lr: 2.20e-05 mem: 47% pow: 659.291 W 0: INFO 26-04-29 23:35:38.713800 - 8:00:19 - step: 35230 acc: 0 loss: 1.5472 grad: 1.49e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.618 data: 0.0877 lr: 2.20e-05 mem: 47% pow: 657.921 W 0: INFO 26-04-29 23:35:52.990089 - 8:00:33 - step: 35240 acc: 0 loss: 1.7532 grad: 1.58e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.6795 data: 0.0034 lr: 2.20e-05 mem: 47% pow: 664.693 W 0: INFO 26-04-29 23:36:07.940457 - 8:00:48 - step: 35250 acc: 0 loss: 1.7082 grad: 1.61e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.6018 data: 0.0911 lr: 2.19e-05 mem: 47% pow: 658.942 W 0: INFO 26-04-29 23:36:22.758907 - 8:01:03 - step: 35260 acc: 0 loss: 1.0589 grad: 1.52e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.7649 data: 0.0607 lr: 2.19e-05 mem: 47% pow: 579.295 W 0: INFO 26-04-29 23:36:36.964942 - 8:01:17 - step: 35270 acc: 0 loss: 1.2397 grad: 1.50e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.8141 data: 0.0032 lr: 2.19e-05 mem: 47% pow: 582.037 W 0: INFO 26-04-29 23:36:52.018557 - 8:01:32 - step: 35280 acc: 0 loss: 1.5552 grad: 1.59e-01 flops: 3.75e+14 wps: 4.36e+04 iter: 0.8133 data: 0.0913 lr: 2.19e-05 mem: 47% pow: 547.171 W 0: INFO 26-04-29 23:37:06.514993 - 8:01:47 - step: 35290 acc: 0 loss: 1.5364 grad: 1.46e-01 flops: 3.90e+14 wps: 4.52e+04 iter: 0.6237 data: 0.0932 lr: 2.19e-05 mem: 47% pow: 640.825 W 0: INFO 26-04-29 23:37:21.323143 - 8:02:02 - step: 35300 acc: 0 loss: 1.2973 grad: 1.50e-01 flops: 3.81e+14 wps: 4.43e+04 iter: 0.6408 data: 0.0781 lr: 2.19e-05 mem: 47% pow: 640.359 W 0: INFO 26-04-29 23:37:40.269381 - 8:02:21 - step: 35310 acc: 0 loss: 1.4099 grad: 1.52e-01 flops: 2.98e+14 wps: 3.46e+04 iter: 0.6242 data: 0.071 lr: 2.19e-05 mem: 54% pow: 648.74 W 0: INFO 26-04-29 23:37:54.856697 - 8:02:35 - step: 35320 acc: 0 loss: 1.6009 grad: 3.64e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6379 data: 0.088 lr: 2.18e-05 mem: 47% pow: 638.869 W 0: INFO 26-04-29 23:38:09.767346 - 8:02:50 - step: 35330 acc: 0 loss: 1.724 grad: 1.54e-01 flops: 3.79e+14 wps: 4.40e+04 iter: 0.5834 data: 0.0927 lr: 2.18e-05 mem: 47% pow: 666.219 W 0: INFO 26-04-29 23:38:24.244068 - 8:03:05 - step: 35340 acc: 0 loss: 1.161 grad: 1.48e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.6261 data: 0.0949 lr: 2.18e-05 mem: 47% pow: 641.304 W 0: INFO 26-04-29 23:38:39.076769 - 8:03:19 - step: 35350 acc: 0 loss: 1.7944 grad: 1.57e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.617 data: 0.0873 lr: 2.18e-05 mem: 47% pow: 642.555 W 0: INFO 26-04-29 23:38:53.807470 - 8:03:34 - step: 35360 acc: 0 loss: 1.8603 grad: 1.50e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.5917 data: 0.0903 lr: 2.18e-05 mem: 47% pow: 659.342 W 0: INFO 26-04-29 23:39:08.220763 - 8:03:49 - step: 35370 acc: 0 loss: 1.404 grad: 1.47e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6844 data: 0.0875 lr: 2.18e-05 mem: 47% pow: 610.764 W 0: INFO 26-04-29 23:39:22.653305 - 8:04:03 - step: 35380 acc: 0 loss: 1.0662 grad: 1.47e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6694 data: 0.0033 lr: 2.18e-05 mem: 47% pow: 664.277 W 0: INFO 26-04-29 23:39:37.089321 - 8:04:17 - step: 35390 acc: 0 loss: 1.7819 grad: 1.49e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.5933 data: 0.0886 lr: 2.17e-05 mem: 47% pow: 657.147 W 0: INFO 26-04-29 23:39:51.858504 - 8:04:32 - step: 35400 acc: 0 loss: 1.5705 grad: 1.44e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.703 data: 0.089 lr: 2.17e-05 mem: 47% pow: 617.253 W 0: INFO 26-04-29 23:40:09.501801 - 8:04:50 - step: 35410 acc: 0 loss: 1.5216 grad: 1.52e-01 flops: 3.20e+14 wps: 3.72e+04 iter: 0.5827 data: 0.1265 lr: 2.17e-05 mem: 54% pow: 657.845 W 0: INFO 26-04-29 23:40:24.209548 - 8:05:05 - step: 35420 acc: 0 loss: 1.7925 grad: 1.45e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6539 data: 0.0822 lr: 2.17e-05 mem: 47% pow: 622.203 W 0: INFO 26-04-29 23:40:39.288623 - 8:05:20 - step: 35430 acc: 0 loss: 1.4042 grad: 1.53e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.5986 data: 0.0812 lr: 2.17e-05 mem: 47% pow: 658.455 W 0: INFO 26-04-29 23:40:54.229658 - 8:05:35 - step: 35440 acc: 0 loss: 0.9618 grad: 1.51e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.7573 data: 0.0846 lr: 2.17e-05 mem: 47% pow: 567.803 W 0: INFO 26-04-29 23:41:09.048752 - 8:05:49 - step: 35450 acc: 0 loss: 1.3649 grad: 1.48e-01 flops: 3.81e+14 wps: 4.43e+04 iter: 0.724 data: 0.0686 lr: 2.17e-05 mem: 47% pow: 597.897 W 0: INFO 26-04-29 23:41:23.744082 - 8:06:04 - step: 35460 acc: 0 loss: 1.0455 grad: 1.53e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.5877 data: 0.0901 lr: 2.16e-05 mem: 47% pow: 663.677 W 0: INFO 26-04-29 23:41:38.296075 - 8:06:19 - step: 35470 acc: 0 loss: 1.5191 grad: 1.55e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.597 data: 0.0928 lr: 2.16e-05 mem: 47% pow: 651.428 W 0: INFO 26-04-29 23:41:52.848515 - 8:06:33 - step: 35480 acc: 0 loss: 1.3806 grad: 1.54e-01 flops: 3.88e+14 wps: 4.51e+04 iter: 0.6211 data: 0.0923 lr: 2.16e-05 mem: 47% pow: 652.803 W 0: INFO 26-04-29 23:42:07.637667 - 8:06:48 - step: 35490 acc: 0 loss: 1.2496 grad: 1.47e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.5986 data: 0.0849 lr: 2.16e-05 mem: 47% pow: 689.442 W 0: INFO 26-04-29 23:42:22.224371 - 8:07:03 - step: 35500 acc: 0 loss: 1.2999 grad: 1.48e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.5905 data: 0.0842 lr: 2.16e-05 mem: 47% pow: 666.852 W 0: INFO 26-04-29 23:42:40.140081 - 8:07:20 - step: 35510 acc: 0 loss: 1.1659 grad: 1.53e-01 flops: 3.15e+14 wps: 3.66e+04 iter: 0.7096 data: 0.0623 lr: 2.16e-05 mem: 54% pow: 605.448 W 0: INFO 26-04-29 23:42:54.672260 - 8:07:35 - step: 35520 acc: 0 loss: 1.5026 grad: 1.63e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 0.6196 data: 0.0761 lr: 2.15e-05 mem: 47% pow: 650.63 W 0: INFO 26-04-29 23:43:09.007433 - 8:07:49 - step: 35530 acc: 0 loss: 1.3964 grad: 1.48e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.58 data: 0.0921 lr: 2.15e-05 mem: 47% pow: 665.235 W 0: INFO 26-04-29 23:43:23.348692 - 8:08:04 - step: 35540 acc: 0 loss: 1.6156 grad: 1.58e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6278 data: 0.0641 lr: 2.15e-05 mem: 47% pow: 660.927 W 0: INFO 26-04-29 23:43:38.038083 - 8:08:18 - step: 35550 acc: 0 loss: 1.3852 grad: 1.56e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6062 data: 0.0838 lr: 2.15e-05 mem: 47% pow: 656.473 W 0: INFO 26-04-29 23:43:52.692843 - 8:08:33 - step: 35560 acc: 0 loss: 1.1673 grad: 1.45e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6361 data: 0.0832 lr: 2.15e-05 mem: 47% pow: 636.767 W 0: INFO 26-04-29 23:44:07.097587 - 8:08:47 - step: 35570 acc: 0 loss: 1.2998 grad: 1.58e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.5772 data: 0.1038 lr: 2.15e-05 mem: 47% pow: 664.381 W 0: INFO 26-04-29 23:44:21.620849 - 8:09:02 - step: 35580 acc: 0 loss: 1.3064 grad: 1.53e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.849 data: 0.0742 lr: 2.15e-05 mem: 47% pow: 529.625 W 0: INFO 26-04-29 23:44:35.997226 - 8:09:16 - step: 35590 acc: 0 loss: 1.1411 grad: 1.47e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.5813 data: 0.188 lr: 2.14e-05 mem: 47% pow: 619.004 W 0: INFO 26-04-29 23:44:50.373464 - 8:09:31 - step: 35600 acc: 0 loss: 2.1601 grad: 1.46e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6066 data: 0.0707 lr: 2.14e-05 mem: 47% pow: 655.082 W 0: INFO 26-04-29 23:45:07.970106 - 8:09:48 - step: 35610 acc: 0 loss: 1.6011 grad: 1.46e-01 flops: 3.21e+14 wps: 3.73e+04 iter: 0.6697 data: 0.0034 lr: 2.14e-05 mem: 54% pow: 673.007 W 0: INFO 26-04-29 23:45:22.254435 - 8:10:03 - step: 35620 acc: 0 loss: 1.4588 grad: 1.51e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.6003 data: 0.0943 lr: 2.14e-05 mem: 47% pow: 660.56 W 0: INFO 26-04-29 23:45:37.086326 - 8:10:17 - step: 35630 acc: 0 loss: 1.7301 grad: 1.52e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.6343 data: 0.0745 lr: 2.14e-05 mem: 47% pow: 650.461 W 0: INFO 26-04-29 23:45:51.557961 - 8:10:32 - step: 35640 acc: 0 loss: 1.5372 grad: 1.45e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.646 data: 0.0953 lr: 2.14e-05 mem: 47% pow: 637.608 W 0: INFO 26-04-29 23:46:06.509064 - 8:10:47 - step: 35650 acc: 0 loss: 1.6737 grad: 1.61e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.6037 data: 0.0853 lr: 2.14e-05 mem: 47% pow: 662.099 W 0: INFO 26-04-29 23:46:21.250096 - 8:11:02 - step: 35660 acc: 0 loss: 1.6597 grad: 1.48e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.5774 data: 0.1234 lr: 2.13e-05 mem: 47% pow: 653.596 W 0: INFO 26-04-29 23:46:35.563723 - 8:11:16 - step: 35670 acc: 0 loss: 1.1346 grad: 1.51e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6307 data: 0.0816 lr: 2.13e-05 mem: 47% pow: 641.04 W 0: INFO 26-04-29 23:46:50.836759 - 8:11:31 - step: 35680 acc: 0 loss: 1.356 grad: 1.48e-01 flops: 3.70e+14 wps: 4.29e+04 iter: 0.6999 data: 0.0746 lr: 2.13e-05 mem: 47% pow: 624.71 W 0: INFO 26-04-29 23:47:05.766293 - 8:11:46 - step: 35690 acc: 0 loss: 1.2806 grad: 1.52e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.5792 data: 0.1023 lr: 2.13e-05 mem: 47% pow: 680.122 W 0: INFO 26-04-29 23:47:20.398504 - 8:12:01 - step: 35700 acc: 0 loss: 0.9659 grad: 1.54e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.6795 data: 0.0851 lr: 2.13e-05 mem: 47% pow: 619.304 W 0: INFO 26-04-29 23:47:38.121141 - 8:12:18 - step: 35710 acc: 0 loss: 1.3173 grad: 1.47e-01 flops: 3.19e+14 wps: 3.70e+04 iter: 0.6331 data: 0.094 lr: 2.13e-05 mem: 54% pow: 644.912 W 0: INFO 26-04-29 23:47:52.234435 - 8:12:33 - step: 35720 acc: 0 loss: 1.3034 grad: 1.49e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6092 data: 0.0909 lr: 2.13e-05 mem: 47% pow: 644.788 W 0: INFO 26-04-29 23:48:06.437318 - 8:12:47 - step: 35730 acc: 0 loss: 1.433 grad: 1.46e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6174 data: 0.0985 lr: 2.12e-05 mem: 47% pow: 633.512 W 0: INFO 26-04-29 23:48:20.860825 - 8:13:01 - step: 35740 acc: 0 loss: 1.1385 grad: 1.48e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.5993 data: 0.0999 lr: 2.12e-05 mem: 47% pow: 643.592 W 0: INFO 26-04-29 23:48:35.759567 - 8:13:16 - step: 35750 acc: 0 loss: 1.4 grad: 1.46e-01 flops: 3.79e+14 wps: 4.40e+04 iter: 0.6397 data: 0.0946 lr: 2.12e-05 mem: 47% pow: 626.76 W 0: INFO 26-04-29 23:48:50.470027 - 8:13:31 - step: 35760 acc: 0 loss: 1.6585 grad: 1.50e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.6458 data: 0.0698 lr: 2.12e-05 mem: 47% pow: 641.954 W 0: INFO 26-04-29 23:49:05.009984 - 8:13:45 - step: 35770 acc: 0 loss: 1.5411 grad: 1.56e-01 flops: 3.88e+14 wps: 4.51e+04 iter: 0.68 data: 0.0754 lr: 2.12e-05 mem: 47% pow: 615.084 W 0: INFO 26-04-29 23:49:19.739443 - 8:14:00 - step: 35780 acc: 0 loss: 1.3765 grad: 1.48e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.9164 data: 0.0036 lr: 2.12e-05 mem: 47% pow: 527.93 W 0: INFO 26-04-29 23:49:34.039468 - 8:14:14 - step: 35790 acc: 0 loss: 1.1267 grad: 1.55e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.616 data: 0.0866 lr: 2.11e-05 mem: 47% pow: 653.298 W 0: INFO 26-04-29 23:49:49.081743 - 8:14:29 - step: 35800 acc: 0 loss: 1.2463 grad: 1.58e-01 flops: 3.75e+14 wps: 4.36e+04 iter: 0.7819 data: 0.0036 lr: 2.11e-05 mem: 47% pow: 605.142 W 0: INFO 26-04-29 23:50:06.699075 - 8:14:47 - step: 35810 acc: 0 loss: 1.2658 grad: 1.57e-01 flops: 3.21e+14 wps: 3.72e+04 iter: 0.5926 data: 0.0857 lr: 2.11e-05 mem: 54% pow: 667.002 W 0: INFO 26-04-29 23:50:21.218198 - 8:15:02 - step: 35820 acc: 0 loss: 1.1229 grad: 1.58e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.7672 data: 0.0842 lr: 2.11e-05 mem: 47% pow: 568.576 W 0: INFO 26-04-29 23:50:36.251288 - 8:15:17 - step: 35830 acc: 0 loss: 1.4883 grad: 1.48e-01 flops: 3.76e+14 wps: 4.36e+04 iter: 0.6096 data: 0.0888 lr: 2.11e-05 mem: 47% pow: 679.247 W 0: INFO 26-04-29 23:50:51.042880 - 8:15:31 - step: 35840 acc: 0 loss: 1.9363 grad: 1.49e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.5795 data: 0.1069 lr: 2.11e-05 mem: 47% pow: 670.319 W 0: INFO 26-04-29 23:51:05.787244 - 8:15:46 - step: 35850 acc: 0 loss: 1.8919 grad: 1.54e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.6209 data: 0.1099 lr: 2.11e-05 mem: 47% pow: 633.076 W 0: INFO 26-04-29 23:51:20.454872 - 8:16:01 - step: 35860 acc: 0 loss: 1.5298 grad: 1.53e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6826 data: 0.0763 lr: 2.10e-05 mem: 47% pow: 622.307 W 0: INFO 26-04-29 23:51:35.318389 - 8:16:16 - step: 35870 acc: 0 loss: 1.613 grad: 1.51e-01 flops: 3.80e+14 wps: 4.41e+04 iter: 0.5867 data: 0.0956 lr: 2.10e-05 mem: 47% pow: 655.128 W 0: INFO 26-04-29 23:51:49.368395 - 8:16:30 - step: 35880 acc: 0 loss: 1.3445 grad: 1.57e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6962 data: 0.0882 lr: 2.10e-05 mem: 47% pow: 611.259 W 0: INFO 26-04-29 23:52:04.328904 - 8:16:45 - step: 35890 acc: 0 loss: 1.6016 grad: 1.51e-01 flops: 3.78e+14 wps: 4.38e+04 iter: 0.8291 data: 0.0846 lr: 2.10e-05 mem: 47% pow: 536.219 W 0: INFO 26-04-29 23:52:18.585559 - 8:16:59 - step: 35900 acc: 0 loss: 1.5387 grad: 1.48e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6801 data: 0.0689 lr: 2.10e-05 mem: 47% pow: 636.477 W 0: INFO 26-04-29 23:52:35.671536 - 8:17:16 - step: 35910 acc: 0 loss: 1.7106 grad: 1.50e-01 flops: 3.31e+14 wps: 3.84e+04 iter: 0.5865 data: 0.0902 lr: 2.10e-05 mem: 54% pow: 663.311 W 0: INFO 26-04-29 23:52:50.383775 - 8:17:31 - step: 35920 acc: 0 loss: 1.7136 grad: 1.51e-01 flops: 3.84e+14 wps: 4.46e+04 iter: 0.5967 data: 0.1008 lr: 2.10e-05 mem: 47% pow: 650.473 W 0: INFO 26-04-29 23:53:04.654735 - 8:17:45 - step: 35930 acc: 0 loss: 1.7179 grad: 1.49e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.5946 data: 0.0853 lr: 2.09e-05 mem: 47% pow: 660.787 W 0: INFO 26-04-29 23:53:19.180718 - 8:17:59 - step: 35940 acc: 0 loss: 1.0504 grad: 1.54e-01 flops: 3.89e+14 wps: 4.51e+04 iter: 0.8088 data: 0.055 lr: 2.09e-05 mem: 47% pow: 557.403 W 0: INFO 26-04-29 23:53:33.860655 - 8:18:14 - step: 35950 acc: 0 loss: 1.5347 grad: 1.61e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.7978 data: 0.1494 lr: 2.09e-05 mem: 47% pow: 513.656 W 0: INFO 26-04-29 23:53:48.253795 - 8:18:29 - step: 35960 acc: 0 loss: 1.6787 grad: 1.63e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.5865 data: 0.091 lr: 2.09e-05 mem: 47% pow: 663.7 W 0: INFO 26-04-29 23:54:02.766782 - 8:18:43 - step: 35970 acc: 0 loss: 1.2934 grad: 1.59e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.5829 data: 0.0871 lr: 2.09e-05 mem: 47% pow: 673.386 W 0: INFO 26-04-29 23:54:17.240274 - 8:18:58 - step: 35980 acc: 0 loss: 1.4963 grad: 1.53e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.7809 data: 0.0828 lr: 2.09e-05 mem: 47% pow: 565.936 W 0: INFO 26-04-29 23:54:31.817448 - 8:19:12 - step: 35990 acc: 0 loss: 1.3442 grad: 1.71e-01 flops: 3.87e+14 wps: 4.50e+04 iter: 0.6502 data: 0.0922 lr: 2.08e-05 mem: 47% pow: 635.823 W 0: INFO 26-04-29 23:54:46.192951 - 8:19:26 - step: 36000 acc: 0 loss: 1.3271 grad: 1.43e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6079 data: 0.0873 lr: 2.08e-05 mem: 47% pow: 648.099 W 0: INFO 26-04-29 23:54:49.917421 - 8:19:30 - garbage collection 0: INFO 26-04-29 23:55:04.843825 - 8:19:45 - step: 36010 acc: 0 loss: 1.2302 grad: 1.57e-01 flops: 3.03e+14 wps: 3.51e+04 iter: 0.7597 data: 0.0033 lr: 2.08e-05 mem: 54% pow: 621.487 W 0: INFO 26-04-29 23:55:19.240075 - 8:20:00 - step: 36020 acc: 0 loss: 1.8573 grad: 1.51e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.7381 data: 0.0812 lr: 2.08e-05 mem: 47% pow: 579.307 W 0: INFO 26-04-29 23:55:34.009813 - 8:20:14 - step: 36030 acc: 0 loss: 1.574 grad: 1.54e-01 flops: 3.82e+14 wps: 4.44e+04 iter: 0.6507 data: 0.0826 lr: 2.08e-05 mem: 47% pow: 636.571 W 0: INFO 26-04-29 23:55:48.857225 - 8:20:29 - step: 36040 acc: 0 loss: 1.3174 grad: 1.46e-01 flops: 3.80e+14 wps: 4.42e+04 iter: 0.6311 data: 0.0853 lr: 2.08e-05 mem: 47% pow: 635.698 W 0: INFO 26-04-29 23:56:03.082516 - 8:20:43 - step: 36050 acc: 0 loss: 2.0968 grad: 1.57e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6057 data: 0.0712 lr: 2.08e-05 mem: 47% pow: 667.192 W 0: INFO 26-04-29 23:56:17.921656 - 8:20:58 - step: 36060 acc: 0 loss: 1.247 grad: 1.54e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.8129 data: 0.0881 lr: 2.07e-05 mem: 47% pow: 530.823 W 0: INFO 26-04-29 23:56:32.049299 - 8:21:12 - step: 36070 acc: 0 loss: 1.4138 grad: 1.49e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6096 data: 0.0807 lr: 2.07e-05 mem: 47% pow: 658.407 W 0: INFO 26-04-29 23:56:46.554601 - 8:21:27 - step: 36080 acc: 0 loss: 1.4656 grad: 1.49e-01 flops: 3.90e+14 wps: 4.52e+04 iter: 0.6978 data: 0.083 lr: 2.07e-05 mem: 47% pow: 608.887 W 0: INFO 26-04-29 23:57:00.865578 - 8:21:41 - step: 36090 acc: 0 loss: 1.2683 grad: 1.47e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.5842 data: 0.0976 lr: 2.07e-05 mem: 47% pow: 685.958 W 0: INFO 26-04-29 23:57:15.377006 - 8:21:56 - step: 36100 acc: 0 loss: 1.3592 grad: 1.52e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.6994 data: 0.0801 lr: 2.07e-05 mem: 47% pow: 602.561 W 0: INFO 26-04-29 23:57:33.168617 - 8:22:13 - step: 36110 acc: 0 loss: 1.4981 grad: 1.53e-01 flops: 3.17e+14 wps: 3.68e+04 iter: 0.6126 data: 0.0762 lr: 2.07e-05 mem: 54% pow: 655.719 W 0: INFO 26-04-29 23:57:47.442442 - 8:22:28 - step: 36120 acc: 0 loss: 1.6571 grad: 1.51e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.8558 data: 0.0817 lr: 2.07e-05 mem: 47% pow: 514.495 W 0: INFO 26-04-29 23:58:01.616182 - 8:22:42 - step: 36130 acc: 0 loss: 1.2958 grad: 1.50e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.7152 data: 0.0767 lr: 2.06e-05 mem: 47% pow: 604.842 W 0: INFO 26-04-29 23:58:16.351926 - 8:22:57 - step: 36140 acc: 0 loss: 1.6421 grad: 1.52e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.6474 data: 0.0851 lr: 2.06e-05 mem: 47% pow: 632.059 W 0: INFO 26-04-29 23:58:31.466140 - 8:23:12 - step: 36150 acc: 0 loss: 1.6318 grad: 1.57e-01 flops: 3.74e+14 wps: 4.34e+04 iter: 0.7215 data: 0.0403 lr: 2.06e-05 mem: 47% pow: 618.517 W 0: INFO 26-04-29 23:58:46.015070 - 8:23:26 - step: 36160 acc: 0 loss: 1.3464 grad: 1.52e-01 flops: 3.88e+14 wps: 4.51e+04 iter: 0.6224 data: 0.0933 lr: 2.06e-05 mem: 47% pow: 638.584 W 0: INFO 26-04-29 23:59:00.388177 - 8:23:41 - step: 36170 acc: 0 loss: 1.2817 grad: 1.46e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6051 data: 0.0827 lr: 2.06e-05 mem: 47% pow: 656.835 W 0: INFO 26-04-29 23:59:15.575437 - 8:23:56 - step: 36180 acc: 0 loss: 1.0291 grad: 1.52e-01 flops: 3.72e+14 wps: 4.32e+04 iter: 0.658 data: 0.0701 lr: 2.06e-05 mem: 47% pow: 633.967 W 0: INFO 26-04-29 23:59:30.495917 - 8:24:11 - step: 36190 acc: 0 loss: 1.625 grad: 1.59e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.7016 data: 0.0745 lr: 2.06e-05 mem: 47% pow: 613.711 W 0: INFO 26-04-29 23:59:44.844464 - 8:24:25 - step: 36200 acc: 0 loss: 1.2134 grad: 1.50e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6485 data: 0.0947 lr: 2.05e-05 mem: 47% pow: 623.581 W 0: INFO 26-04-30 00:00:02.356032 - 8:24:43 - step: 36210 acc: 0 loss: 1.3283 grad: 1.49e-01 flops: 3.23e+14 wps: 3.74e+04 iter: 0.6363 data: 0.0543 lr: 2.05e-05 mem: 54% pow: 673.536 W 0: INFO 26-04-30 00:00:16.904034 - 8:24:57 - step: 36220 acc: 0 loss: 1.2439 grad: 1.49e-01 flops: 3.88e+14 wps: 4.51e+04 iter: 0.7455 data: 0.0868 lr: 2.05e-05 mem: 47% pow: 578.26 W 0: INFO 26-04-30 00:00:31.124767 - 8:25:11 - step: 36230 acc: 0 loss: 1.9855 grad: 1.49e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6672 data: 0.0582 lr: 2.05e-05 mem: 47% pow: 641.395 W 0: INFO 26-04-30 00:00:45.929665 - 8:25:26 - step: 36240 acc: 0 loss: 1.3038 grad: 1.53e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.6384 data: 0.0812 lr: 2.05e-05 mem: 47% pow: 632.635 W 0: INFO 26-04-30 00:01:00.167521 - 8:25:40 - step: 36250 acc: 0 loss: 1.6078 grad: 1.53e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6131 data: 0.0874 lr: 2.05e-05 mem: 47% pow: 653.224 W 0: INFO 26-04-30 00:01:15.078148 - 8:25:55 - step: 36260 acc: 0 loss: 1.1101 grad: 1.66e-01 flops: 3.79e+14 wps: 4.40e+04 iter: 0.8514 data: 0.0034 lr: 2.04e-05 mem: 47% pow: 568.371 W 0: INFO 26-04-30 00:01:29.293161 - 8:26:10 - step: 36270 acc: 0 loss: 1.2401 grad: 1.69e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6213 data: 0.0916 lr: 2.04e-05 mem: 47% pow: 642.357 W 0: INFO 26-04-30 00:01:43.533427 - 8:26:24 - step: 36280 acc: 0 loss: 1.8139 grad: 1.49e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.6824 data: 0.0877 lr: 2.04e-05 mem: 47% pow: 617.579 W 0: INFO 26-04-30 00:01:58.147827 - 8:26:38 - step: 36290 acc: 0 loss: 1.4169 grad: 1.48e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6005 data: 0.084 lr: 2.04e-05 mem: 47% pow: 670.998 W 0: INFO 26-04-30 00:02:12.513525 - 8:26:53 - step: 36300 acc: 0 loss: 1.4749 grad: 1.51e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6239 data: 0.0685 lr: 2.04e-05 mem: 47% pow: 650.012 W 0: INFO 26-04-30 00:02:30.237814 - 8:27:11 - step: 36310 acc: 0 loss: 1.8644 grad: 1.52e-01 flops: 3.19e+14 wps: 3.70e+04 iter: 0.6534 data: 0.0845 lr: 2.04e-05 mem: 54% pow: 619.701 W 0: INFO 26-04-30 00:02:45.666427 - 8:27:26 - step: 36320 acc: 0 loss: 1.1775 grad: 1.55e-01 flops: 3.66e+14 wps: 4.25e+04 iter: 0.6138 data: 0.082 lr: 2.04e-05 mem: 47% pow: 650.757 W 0: INFO 26-04-30 00:03:00.408396 - 8:27:41 - step: 36330 acc: 0 loss: 1.6757 grad: 1.50e-01 flops: 3.83e+14 wps: 4.45e+04 iter: 0.5988 data: 0.0897 lr: 2.03e-05 mem: 47% pow: 657.874 W 0: INFO 26-04-30 00:03:14.363230 - 8:27:55 - step: 36340 acc: 0 loss: 1.5454 grad: 1.56e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6057 data: 0.0916 lr: 2.03e-05 mem: 47% pow: 654.141 W 0: INFO 26-04-30 00:03:29.046520 - 8:28:09 - step: 36350 acc: 0 loss: 1.2016 grad: 1.50e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.7428 data: 0.0915 lr: 2.03e-05 mem: 47% pow: 576.758 W 0: INFO 26-04-30 00:03:43.806961 - 8:28:24 - step: 36360 acc: 0 loss: 1.4117 grad: 1.51e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.687 data: 0.0589 lr: 2.03e-05 mem: 47% pow: 627.997 W 0: INFO 26-04-30 00:03:58.451447 - 8:28:39 - step: 36370 acc: 0 loss: 1.3002 grad: 1.59e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.6179 data: 0.0881 lr: 2.03e-05 mem: 47% pow: 649.139 W 0: INFO 26-04-30 00:04:12.716526 - 8:28:53 - step: 36380 acc: 0 loss: 1.489 grad: 1.58e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.8109 data: 0.0358 lr: 2.03e-05 mem: 47% pow: 578.695 W 0: INFO 26-04-30 00:04:27.352902 - 8:29:08 - step: 36390 acc: 0 loss: 1.5177 grad: 1.48e-01 flops: 3.86e+14 wps: 4.48e+04 iter: 0.608 data: 0.0823 lr: 2.03e-05 mem: 47% pow: 661.453 W 0: INFO 26-04-30 00:04:41.791032 - 8:29:22 - step: 36400 acc: 0 loss: 1.1973 grad: 1.60e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6471 data: 0.0819 lr: 2.02e-05 mem: 47% pow: 634.516 W 0: INFO 26-04-30 00:04:59.052379 - 8:29:39 - step: 36410 acc: 0 loss: 1.6904 grad: 1.63e-01 flops: 3.27e+14 wps: 3.80e+04 iter: 0.6128 data: 0.0876 lr: 2.02e-05 mem: 54% pow: 644.555 W 0: INFO 26-04-30 00:05:13.045320 - 8:29:53 - step: 36420 acc: 0 loss: 1.7075 grad: 1.49e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6165 data: 0.0817 lr: 2.02e-05 mem: 47% pow: 658.788 W 0: INFO 26-04-30 00:05:26.964866 - 8:30:07 - step: 36430 acc: 0 loss: 1.5549 grad: 1.46e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5914 data: 0.0864 lr: 2.02e-05 mem: 47% pow: 682.707 W 0: INFO 26-04-30 00:05:40.883494 - 8:30:21 - step: 36440 acc: 0 loss: 1.6227 grad: 1.52e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6249 data: 0.089 lr: 2.02e-05 mem: 47% pow: 645.631 W 0: INFO 26-04-30 00:05:55.185877 - 8:30:35 - step: 36450 acc: 0 loss: 1.3371 grad: 1.56e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6116 data: 0.0915 lr: 2.02e-05 mem: 47% pow: 656.197 W 0: INFO 26-04-30 00:06:09.532562 - 8:30:50 - step: 36460 acc: 0 loss: 1.5975 grad: 1.51e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6379 data: 0.0833 lr: 2.01e-05 mem: 47% pow: 653.07 W 0: INFO 26-04-30 00:06:23.620799 - 8:31:04 - step: 36470 acc: 0 loss: 1.5545 grad: 1.51e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.7032 data: 0.0916 lr: 2.01e-05 mem: 47% pow: 605.793 W 0: INFO 26-04-30 00:06:37.741832 - 8:31:18 - step: 36480 acc: 0 loss: 1.2416 grad: 1.48e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.597 data: 0.0913 lr: 2.01e-05 mem: 47% pow: 654.244 W 0: INFO 26-04-30 00:06:51.668841 - 8:31:32 - step: 36490 acc: 0 loss: 1.8045 grad: 1.49e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.7439 data: 0.1038 lr: 2.01e-05 mem: 47% pow: 570.631 W 0: INFO 26-04-30 00:07:05.859893 - 8:31:46 - step: 36500 acc: 0 loss: 1.4926 grad: 1.56e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5865 data: 0.1078 lr: 2.01e-05 mem: 47% pow: 652.544 W 0: INFO 26-04-30 00:07:22.701448 - 8:32:03 - step: 36510 acc: 0 loss: 1.4686 grad: 1.54e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.5784 data: 0.1117 lr: 2.01e-05 mem: 54% pow: 655.551 W 0: INFO 26-04-30 00:07:36.701346 - 8:32:17 - step: 36520 acc: 0 loss: 1.5386 grad: 1.50e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6179 data: 0.0783 lr: 2.01e-05 mem: 47% pow: 644.58 W 0: INFO 26-04-30 00:07:50.745439 - 8:32:31 - step: 36530 acc: 0 loss: 1.3862 grad: 1.53e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.705 data: 0.0867 lr: 2.00e-05 mem: 47% pow: 607.67 W 0: INFO 26-04-30 00:08:05.618731 - 8:32:46 - step: 36540 acc: 0 loss: 1.48 grad: 1.52e-01 flops: 3.80e+14 wps: 4.41e+04 iter: 0.5841 data: 0.0915 lr: 2.00e-05 mem: 47% pow: 661.719 W 0: INFO 26-04-30 00:08:19.259187 - 8:33:00 - step: 36550 acc: 0 loss: 1.6732 grad: 1.49e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5943 data: 0.0831 lr: 2.00e-05 mem: 47% pow: 656.391 W 0: INFO 26-04-30 00:08:33.375943 - 8:33:14 - step: 36560 acc: 0 loss: 1.274 grad: 1.69e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6231 data: 0.0872 lr: 2.00e-05 mem: 47% pow: 649.825 W 0: INFO 26-04-30 00:08:47.352197 - 8:33:28 - step: 36570 acc: 0 loss: 1.302 grad: 1.52e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7205 data: 0.0563 lr: 2.00e-05 mem: 47% pow: 607.516 W 0: INFO 26-04-30 00:09:01.061644 - 8:33:41 - step: 36580 acc: 0 loss: 1.989 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5879 data: 0.0902 lr: 2.00e-05 mem: 47% pow: 660.802 W 0: INFO 26-04-30 00:09:15.301550 - 8:33:56 - step: 36590 acc: 0 loss: 1.3016 grad: 1.54e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.7322 data: 0.0032 lr: 2.00e-05 mem: 47% pow: 623.32 W 0: INFO 26-04-30 00:09:29.386978 - 8:34:10 - step: 36600 acc: 0 loss: 1.374 grad: 1.57e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6224 data: 0.0894 lr: 1.99e-05 mem: 47% pow: 653.876 W 0: INFO 26-04-30 00:09:46.862499 - 8:34:27 - step: 36610 acc: 0 loss: 1.4448 grad: 1.55e-01 flops: 3.23e+14 wps: 3.75e+04 iter: 0.577 data: 0.1184 lr: 1.99e-05 mem: 54% pow: 664.183 W 0: INFO 26-04-30 00:10:00.856498 - 8:34:41 - step: 36620 acc: 0 loss: 1.4614 grad: 1.45e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5945 data: 0.0898 lr: 1.99e-05 mem: 47% pow: 662.209 W 0: INFO 26-04-30 00:10:14.650150 - 8:34:55 - step: 36630 acc: 0 loss: 1.3984 grad: 1.54e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6 data: 0.1268 lr: 1.99e-05 mem: 47% pow: 640.848 W 0: INFO 26-04-30 00:10:28.947090 - 8:35:09 - step: 36640 acc: 0 loss: 1.3819 grad: 1.62e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6311 data: 0.0734 lr: 1.99e-05 mem: 47% pow: 652.716 W 0: INFO 26-04-30 00:10:42.897907 - 8:35:23 - step: 36650 acc: 0 loss: 1.5295 grad: 1.52e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5793 data: 0.1535 lr: 1.99e-05 mem: 47% pow: 631.967 W 0: INFO 26-04-30 00:10:56.844398 - 8:35:37 - step: 36660 acc: 0 loss: 1.3852 grad: 1.48e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6141 data: 0.0812 lr: 1.99e-05 mem: 47% pow: 648.258 W 0: INFO 26-04-30 00:11:10.949531 - 8:35:51 - step: 36670 acc: 0 loss: 1.5652 grad: 1.49e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6036 data: 0.0838 lr: 1.98e-05 mem: 47% pow: 655.888 W 0: INFO 26-04-30 00:11:24.781340 - 8:36:05 - step: 36680 acc: 0 loss: 2.0059 grad: 1.52e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6211 data: 0.074 lr: 1.98e-05 mem: 47% pow: 657.746 W 0: INFO 26-04-30 00:11:38.805262 - 8:36:19 - step: 36690 acc: 0 loss: 1.1367 grad: 1.50e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6869 data: 0.0897 lr: 1.98e-05 mem: 47% pow: 612.981 W 0: INFO 26-04-30 00:11:53.383378 - 8:36:34 - step: 36700 acc: 0 loss: 1.1692 grad: 1.50e-01 flops: 3.87e+14 wps: 4.50e+04 iter: 0.5772 data: 0.1215 lr: 1.98e-05 mem: 47% pow: 642.061 W 0: INFO 26-04-30 00:12:09.959904 - 8:36:50 - step: 36710 acc: 0 loss: 1.3069 grad: 1.58e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6162 data: 0.0876 lr: 1.98e-05 mem: 54% pow: 652.746 W 0: INFO 26-04-30 00:12:23.451917 - 8:37:04 - step: 36720 acc: 0 loss: 1.3834 grad: 1.54e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6012 data: 0.0869 lr: 1.98e-05 mem: 47% pow: 677.399 W 0: INFO 26-04-30 00:12:37.396294 - 8:37:18 - step: 36730 acc: 0 loss: 1.2489 grad: 1.51e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5809 data: 0.0913 lr: 1.97e-05 mem: 47% pow: 668.884 W 0: INFO 26-04-30 00:12:51.151620 - 8:37:31 - step: 36740 acc: 0 loss: 1.7771 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6049 data: 0.0821 lr: 1.97e-05 mem: 47% pow: 665.538 W 0: INFO 26-04-30 00:13:05.027149 - 8:37:45 - step: 36750 acc: 0 loss: 1.4291 grad: 1.56e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6033 data: 0.0876 lr: 1.97e-05 mem: 47% pow: 662.04 W 0: INFO 26-04-30 00:13:18.700135 - 8:37:59 - step: 36760 acc: 0 loss: 1.5695 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5971 data: 0.079 lr: 1.97e-05 mem: 47% pow: 663.031 W 0: INFO 26-04-30 00:13:32.565221 - 8:38:13 - step: 36770 acc: 0 loss: 2.3246 grad: 1.52e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.609 data: 0.0878 lr: 1.97e-05 mem: 47% pow: 647.137 W 0: INFO 26-04-30 00:13:46.736518 - 8:38:27 - step: 36780 acc: 0 loss: 1.1799 grad: 1.52e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5994 data: 0.0831 lr: 1.97e-05 mem: 47% pow: 661.644 W 0: INFO 26-04-30 00:14:00.515973 - 8:38:41 - step: 36790 acc: 0 loss: 0.9554 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6101 data: 0.061 lr: 1.97e-05 mem: 47% pow: 671.314 W 0: INFO 26-04-30 00:14:14.591634 - 8:38:55 - step: 36800 acc: 0 loss: 1.5792 grad: 1.51e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.5782 data: 0.1011 lr: 1.96e-05 mem: 47% pow: 661.733 W 0: INFO 26-04-30 00:14:31.819722 - 8:39:12 - step: 36810 acc: 0 loss: 1.1859 grad: 1.57e-01 flops: 3.28e+14 wps: 3.80e+04 iter: 0.6122 data: 0.0835 lr: 1.96e-05 mem: 54% pow: 654.196 W 0: INFO 26-04-30 00:14:45.807971 - 8:39:26 - step: 36820 acc: 0 loss: 0.9199 grad: 1.52e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6497 data: 0.0733 lr: 1.96e-05 mem: 47% pow: 638.991 W 0: INFO 26-04-30 00:14:59.752891 - 8:39:40 - step: 36830 acc: 0 loss: 1.5161 grad: 1.52e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7176 data: 0.0908 lr: 1.96e-05 mem: 47% pow: 597.274 W 0: INFO 26-04-30 00:15:13.700501 - 8:39:54 - step: 36840 acc: 0 loss: 1.1069 grad: 1.54e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6198 data: 0.0602 lr: 1.96e-05 mem: 47% pow: 661.098 W 0: INFO 26-04-30 00:15:27.562671 - 8:40:08 - step: 36850 acc: 0 loss: 1.8796 grad: 1.60e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6158 data: 0.0912 lr: 1.96e-05 mem: 47% pow: 653.276 W 0: INFO 26-04-30 00:15:41.251633 - 8:40:22 - step: 36860 acc: 0 loss: 1.8461 grad: 1.50e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5795 data: 0.088 lr: 1.96e-05 mem: 47% pow: 678.114 W 0: INFO 26-04-30 00:15:55.767174 - 8:40:36 - step: 36870 acc: 0 loss: 1.7212 grad: 2.20e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.792 data: 0.0863 lr: 1.95e-05 mem: 47% pow: 548.874 W 0: INFO 26-04-30 00:16:09.427277 - 8:40:50 - step: 36880 acc: 0 loss: 1.6451 grad: 1.78e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5926 data: 0.0897 lr: 1.95e-05 mem: 47% pow: 654.138 W 0: INFO 26-04-30 00:16:23.238952 - 8:41:04 - step: 36890 acc: 0 loss: 1.6562 grad: 1.74e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5807 data: 0.1491 lr: 1.95e-05 mem: 47% pow: 632.021 W 0: INFO 26-04-30 00:16:37.209457 - 8:41:18 - step: 36900 acc: 0 loss: 1.4649 grad: 1.71e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5975 data: 0.0863 lr: 1.95e-05 mem: 47% pow: 667.008 W 0: INFO 26-04-30 00:16:53.944603 - 8:41:34 - step: 36910 acc: 0 loss: 1.7164 grad: 1.60e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.5871 data: 0.0865 lr: 1.95e-05 mem: 54% pow: 663.482 W 0: INFO 26-04-30 00:17:07.776351 - 8:41:48 - step: 36920 acc: 0 loss: 1.6665 grad: 1.63e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5882 data: 0.0886 lr: 1.95e-05 mem: 47% pow: 657.354 W 0: INFO 26-04-30 00:17:21.458010 - 8:42:02 - step: 36930 acc: 0 loss: 1.5767 grad: 1.61e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5892 data: 0.0858 lr: 1.94e-05 mem: 47% pow: 659.999 W 0: INFO 26-04-30 00:17:35.329550 - 8:42:16 - step: 36940 acc: 0 loss: 1.5575 grad: 1.61e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6902 data: 0.094 lr: 1.94e-05 mem: 47% pow: 603.406 W 0: INFO 26-04-30 00:17:49.134231 - 8:42:29 - step: 36950 acc: 0 loss: 1.7136 grad: 1.64e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6197 data: 0.089 lr: 1.94e-05 mem: 47% pow: 649.061 W 0: INFO 26-04-30 00:18:02.781875 - 8:42:43 - step: 36960 acc: 0 loss: 1.7926 grad: 1.72e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6083 data: 0.0838 lr: 1.94e-05 mem: 47% pow: 664.297 W 0: INFO 26-04-30 00:18:17.070349 - 8:42:57 - step: 36970 acc: 0 loss: 1.526 grad: 1.68e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6 data: 0.0941 lr: 1.94e-05 mem: 47% pow: 648.924 W 0: INFO 26-04-30 00:18:31.315835 - 8:43:12 - step: 36980 acc: 0 loss: 1.3303 grad: 1.64e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.6044 data: 0.0774 lr: 1.94e-05 mem: 47% pow: 663.917 W 0: INFO 26-04-30 00:18:45.063806 - 8:43:25 - step: 36990 acc: 0 loss: 1.41 grad: 1.66e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6139 data: 0.0827 lr: 1.94e-05 mem: 47% pow: 647.782 W 0: INFO 26-04-30 00:18:58.675326 - 8:43:39 - step: 37000 acc: 0 loss: 1.3391 grad: 1.69e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6158 data: 0.0732 lr: 1.93e-05 mem: 47% pow: 663.617 W 0: INFO 26-04-30 00:19:02.417911 - 8:43:43 - garbage collection 0: INFO 26-04-30 00:19:16.846524 - 8:43:57 - step: 37010 acc: 0 loss: 1.4016 grad: 1.65e-01 flops: 3.11e+14 wps: 3.61e+04 iter: 0.5927 data: 0.0833 lr: 1.93e-05 mem: 54% pow: 664.218 W 0: INFO 26-04-30 00:19:30.652896 - 8:44:11 - step: 37020 acc: 0 loss: 1.6358 grad: 1.62e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6277 data: 0.0808 lr: 1.93e-05 mem: 47% pow: 651.372 W 0: INFO 26-04-30 00:19:44.561623 - 8:44:25 - step: 37030 acc: 0 loss: 1.4989 grad: 1.61e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6601 data: 0.0891 lr: 1.93e-05 mem: 47% pow: 629.542 W 0: INFO 26-04-30 00:19:58.527137 - 8:44:39 - step: 37040 acc: 0 loss: 1.348 grad: 1.54e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.614 data: 0.0878 lr: 1.93e-05 mem: 47% pow: 654.634 W 0: INFO 26-04-30 00:20:12.227539 - 8:44:53 - step: 37050 acc: 0 loss: 1.6024 grad: 1.68e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5921 data: 0.0847 lr: 1.93e-05 mem: 47% pow: 657.306 W 0: INFO 26-04-30 00:20:26.309636 - 8:45:07 - step: 37060 acc: 0 loss: 1.4607 grad: 1.63e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6442 data: 0.0968 lr: 1.93e-05 mem: 47% pow: 628.0 W 0: INFO 26-04-30 00:20:40.002305 - 8:45:20 - step: 37070 acc: 0 loss: 1.535 grad: 1.60e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.622 data: 0.0861 lr: 1.92e-05 mem: 47% pow: 658.844 W 0: INFO 26-04-30 00:20:53.681975 - 8:45:34 - step: 37080 acc: 0 loss: 1.2792 grad: 1.65e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5881 data: 0.0891 lr: 1.92e-05 mem: 47% pow: 667.278 W 0: INFO 26-04-30 00:21:07.582334 - 8:45:48 - step: 37090 acc: 0 loss: 1.4484 grad: 1.71e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6855 data: 0.0909 lr: 1.92e-05 mem: 47% pow: 602.231 W 0: INFO 26-04-30 00:21:21.433199 - 8:46:02 - step: 37100 acc: 0 loss: 1.3113 grad: 1.57e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6314 data: 0.0755 lr: 1.92e-05 mem: 47% pow: 647.211 W 0: INFO 26-04-30 00:21:38.231715 - 8:46:19 - step: 37110 acc: 0 loss: 1.3337 grad: 1.63e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6469 data: 0.1032 lr: 1.92e-05 mem: 54% pow: 619.686 W 0: INFO 26-04-30 00:21:52.537318 - 8:46:33 - step: 37120 acc: 0 loss: 1.4491 grad: 1.59e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6061 data: 0.0879 lr: 1.92e-05 mem: 47% pow: 653.646 W 0: INFO 26-04-30 00:22:06.333435 - 8:46:47 - step: 37130 acc: 0 loss: 1.1935 grad: 1.61e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6026 data: 0.0878 lr: 1.92e-05 mem: 47% pow: 655.23 W 0: INFO 26-04-30 00:22:20.191511 - 8:47:00 - step: 37140 acc: 0 loss: 1.3897 grad: 1.61e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5917 data: 0.0938 lr: 1.91e-05 mem: 47% pow: 662.302 W 0: INFO 26-04-30 00:22:34.333820 - 8:47:15 - step: 37150 acc: 0 loss: 1.8409 grad: 1.59e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6649 data: 0.0718 lr: 1.91e-05 mem: 47% pow: 634.63 W 0: INFO 26-04-30 00:22:48.253930 - 8:47:29 - step: 37160 acc: 0 loss: 1.4599 grad: 1.59e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6269 data: 0.0858 lr: 1.91e-05 mem: 47% pow: 657.782 W 0: INFO 26-04-30 00:23:02.317599 - 8:47:43 - step: 37170 acc: 0 loss: 1.4085 grad: 1.68e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.8479 data: 0.0031 lr: 1.91e-05 mem: 47% pow: 568.141 W 0: INFO 26-04-30 00:23:16.254687 - 8:47:57 - step: 37180 acc: 0 loss: 1.5564 grad: 1.62e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6042 data: 0.0873 lr: 1.91e-05 mem: 47% pow: 651.211 W 0: INFO 26-04-30 00:23:29.893358 - 8:48:10 - step: 37190 acc: 0 loss: 1.9157 grad: 1.65e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6111 data: 0.0769 lr: 1.91e-05 mem: 47% pow: 664.307 W 0: INFO 26-04-30 00:23:43.481438 - 8:48:24 - step: 37200 acc: 0 loss: 1.638 grad: 1.74e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5999 data: 0.0932 lr: 1.90e-05 mem: 47% pow: 651.75 W 0: INFO 26-04-30 00:24:00.267785 - 8:48:41 - step: 37210 acc: 0 loss: 1.4927 grad: 1.68e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.5982 data: 0.0886 lr: 1.90e-05 mem: 54% pow: 665.411 W 0: INFO 26-04-30 00:24:13.965401 - 8:48:54 - step: 37220 acc: 0 loss: 1.6875 grad: 1.64e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6406 data: 0.0816 lr: 1.90e-05 mem: 47% pow: 640.444 W 0: INFO 26-04-30 00:24:27.836186 - 8:49:08 - step: 37230 acc: 0 loss: 1.4038 grad: 1.68e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6324 data: 0.0787 lr: 1.90e-05 mem: 47% pow: 658.616 W 0: INFO 26-04-30 00:24:41.513749 - 8:49:22 - step: 37240 acc: 0 loss: 1.3937 grad: 1.60e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5855 data: 0.0871 lr: 1.90e-05 mem: 47% pow: 676.844 W 0: INFO 26-04-30 00:24:56.084779 - 8:49:36 - step: 37250 acc: 0 loss: 1.7015 grad: 1.60e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.5932 data: 0.0839 lr: 1.90e-05 mem: 47% pow: 659.192 W 0: INFO 26-04-30 00:25:10.117689 - 8:49:50 - step: 37260 acc: 0 loss: 1.4836 grad: 1.60e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.5814 data: 0.1087 lr: 1.90e-05 mem: 47% pow: 655.886 W 0: INFO 26-04-30 00:25:24.077536 - 8:50:04 - step: 37270 acc: 0 loss: 1.1424 grad: 1.63e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.69 data: 0.0836 lr: 1.89e-05 mem: 47% pow: 611.819 W 0: INFO 26-04-30 00:25:38.034114 - 8:50:18 - step: 37280 acc: 0 loss: 1.436 grad: 1.75e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6467 data: 0.0859 lr: 1.89e-05 mem: 47% pow: 644.342 W 0: INFO 26-04-30 00:25:51.902404 - 8:50:32 - step: 37290 acc: 0 loss: 1.7141 grad: 1.64e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6111 data: 0.1012 lr: 1.89e-05 mem: 47% pow: 640.46 W 0: INFO 26-04-30 00:26:05.795802 - 8:50:46 - step: 37300 acc: 0 loss: 1.4743 grad: 1.61e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6101 data: 0.0816 lr: 1.89e-05 mem: 47% pow: 662.957 W 0: INFO 26-04-30 00:26:22.573440 - 8:51:03 - step: 37310 acc: 0 loss: 1.4137 grad: 1.69e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.5842 data: 0.0875 lr: 1.89e-05 mem: 54% pow: 676.331 W 0: INFO 26-04-30 00:26:36.180772 - 8:51:16 - step: 37320 acc: 0 loss: 1.5537 grad: 1.63e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5899 data: 0.0868 lr: 1.89e-05 mem: 47% pow: 662.419 W 0: INFO 26-04-30 00:26:49.902738 - 8:51:30 - step: 37330 acc: 0 loss: 1.4842 grad: 1.60e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6036 data: 0.0895 lr: 1.89e-05 mem: 47% pow: 650.783 W 0: INFO 26-04-30 00:27:03.583535 - 8:51:44 - step: 37340 acc: 0 loss: 1.1808 grad: 1.58e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.61 data: 0.0665 lr: 1.88e-05 mem: 47% pow: 661.064 W 0: INFO 26-04-30 00:27:17.310161 - 8:51:58 - step: 37350 acc: 0 loss: 1.6014 grad: 1.54e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.5798 data: 0.0915 lr: 1.88e-05 mem: 47% pow: 674.671 W 0: INFO 26-04-30 00:27:31.066578 - 8:52:11 - step: 37360 acc: 0 loss: 1.3519 grad: 1.66e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6052 data: 0.0878 lr: 1.88e-05 mem: 47% pow: 655.817 W 0: INFO 26-04-30 00:27:45.274468 - 8:52:26 - step: 37370 acc: 0 loss: 1.6339 grad: 1.56e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.6207 data: 0.0677 lr: 1.88e-05 mem: 47% pow: 663.319 W 0: INFO 26-04-30 00:27:59.258576 - 8:52:40 - step: 37380 acc: 0 loss: 1.4318 grad: 1.52e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6135 data: 0.0814 lr: 1.88e-05 mem: 47% pow: 651.243 W 0: INFO 26-04-30 00:28:13.337682 - 8:52:54 - step: 37390 acc: 0 loss: 1.5274 grad: 1.67e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6115 data: 0.0834 lr: 1.88e-05 mem: 47% pow: 653.355 W 0: INFO 26-04-30 00:28:27.406086 - 8:53:08 - step: 37400 acc: 0 loss: 1.4601 grad: 1.76e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.5991 data: 0.0789 lr: 1.88e-05 mem: 47% pow: 659.862 W 0: INFO 26-04-30 00:28:44.301504 - 8:53:25 - step: 37410 acc: 0 loss: 1.7012 grad: 1.60e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.5795 data: 0.1358 lr: 1.87e-05 mem: 54% pow: 644.634 W 0: INFO 26-04-30 00:28:58.065228 - 8:53:38 - step: 37420 acc: 0 loss: 1.5498 grad: 1.75e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6058 data: 0.0937 lr: 1.87e-05 mem: 47% pow: 645.238 W 0: INFO 26-04-30 00:29:11.823454 - 8:53:52 - step: 37430 acc: 0 loss: 1.4617 grad: 1.69e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5922 data: 0.0854 lr: 1.87e-05 mem: 47% pow: 659.656 W 0: INFO 26-04-30 00:29:25.546839 - 8:54:06 - step: 37440 acc: 0 loss: 1.3264 grad: 1.70e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5995 data: 0.0846 lr: 1.87e-05 mem: 47% pow: 664.75 W 0: INFO 26-04-30 00:29:39.315722 - 8:54:20 - step: 37450 acc: 0 loss: 1.3783 grad: 1.66e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5959 data: 0.0845 lr: 1.87e-05 mem: 47% pow: 654.486 W 0: INFO 26-04-30 00:29:53.095406 - 8:54:33 - step: 37460 acc: 0 loss: 1.0462 grad: 1.72e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6069 data: 0.0838 lr: 1.87e-05 mem: 47% pow: 654.438 W 0: INFO 26-04-30 00:30:07.164822 - 8:54:47 - step: 37470 acc: 0 loss: 1.7432 grad: 1.81e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.5805 data: 0.1625 lr: 1.86e-05 mem: 47% pow: 632.746 W 0: INFO 26-04-30 00:30:21.108502 - 8:55:01 - step: 37480 acc: 0 loss: 1.1061 grad: 1.70e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6172 data: 0.0856 lr: 1.86e-05 mem: 47% pow: 668.936 W 0: INFO 26-04-30 00:30:34.758882 - 8:55:15 - step: 37490 acc: 0 loss: 1.1199 grad: 1.64e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5994 data: 0.0869 lr: 1.86e-05 mem: 47% pow: 658.917 W 0: INFO 26-04-30 00:30:48.376808 - 8:55:29 - step: 37500 acc: 0 loss: 1.6875 grad: 1.59e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5926 data: 0.0784 lr: 1.86e-05 mem: 47% pow: 667.19 W 0: INFO 26-04-30 00:31:05.178234 - 8:55:45 - step: 37510 acc: 0 loss: 1.3371 grad: 1.66e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.641 data: 0.051 lr: 1.86e-05 mem: 54% pow: 651.651 W 0: INFO 26-04-30 00:31:19.059068 - 8:55:59 - step: 37520 acc: 0 loss: 1.5733 grad: 1.65e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5819 data: 0.0903 lr: 1.86e-05 mem: 47% pow: 673.844 W 0: INFO 26-04-30 00:31:32.867055 - 8:56:13 - step: 37530 acc: 0 loss: 1.2884 grad: 1.59e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5813 data: 0.0863 lr: 1.86e-05 mem: 47% pow: 672.372 W 0: INFO 26-04-30 00:31:46.429535 - 8:56:27 - step: 37540 acc: 0 loss: 1.4774 grad: 1.62e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.668 data: 0.0402 lr: 1.85e-05 mem: 47% pow: 643.329 W 0: INFO 26-04-30 00:32:00.036001 - 8:56:40 - step: 37550 acc: 0 loss: 1.3113 grad: 1.61e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.615 data: 0.0911 lr: 1.85e-05 mem: 47% pow: 645.654 W 0: INFO 26-04-30 00:32:13.737113 - 8:56:54 - step: 37560 acc: 0 loss: 1.2055 grad: 1.66e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6112 data: 0.0854 lr: 1.85e-05 mem: 47% pow: 642.233 W 0: INFO 26-04-30 00:32:27.445496 - 8:57:08 - step: 37570 acc: 0 loss: 1.2188 grad: 1.75e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6014 data: 0.0849 lr: 1.85e-05 mem: 47% pow: 657.242 W 0: INFO 26-04-30 00:32:40.996190 - 8:57:21 - step: 37580 acc: 0 loss: 1.3521 grad: 1.83e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6304 data: 0.0818 lr: 1.85e-05 mem: 47% pow: 657.595 W 0: INFO 26-04-30 00:32:54.769978 - 8:57:35 - step: 37590 acc: 0 loss: 1.3024 grad: 1.62e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6118 data: 0.0863 lr: 1.85e-05 mem: 47% pow: 654.81 W 0: INFO 26-04-30 00:33:08.321373 - 8:57:49 - step: 37600 acc: 0 loss: 1.3406 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5926 data: 0.0871 lr: 1.85e-05 mem: 47% pow: 660.346 W 0: INFO 26-04-30 00:33:25.162982 - 8:58:05 - step: 37610 acc: 0 loss: 1.5805 grad: 1.63e-01 flops: 3.36e+14 wps: 3.89e+04 iter: 0.6017 data: 0.0897 lr: 1.84e-05 mem: 54% pow: 651.725 W 0: INFO 26-04-30 00:33:38.900222 - 8:58:19 - step: 37620 acc: 0 loss: 1.4506 grad: 1.68e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6091 data: 0.0918 lr: 1.84e-05 mem: 47% pow: 653.923 W 0: INFO 26-04-30 00:33:52.618072 - 8:58:33 - step: 37630 acc: 0 loss: 1.1654 grad: 1.77e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5813 data: 0.0936 lr: 1.84e-05 mem: 47% pow: 662.63 W 0: INFO 26-04-30 00:34:06.476539 - 8:58:47 - step: 37640 acc: 0 loss: 1.5281 grad: 1.61e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6241 data: 0.0774 lr: 1.84e-05 mem: 47% pow: 644.951 W 0: INFO 26-04-30 00:34:20.078215 - 8:59:00 - step: 37650 acc: 0 loss: 1.3089 grad: 1.73e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5793 data: 0.0993 lr: 1.84e-05 mem: 47% pow: 660.331 W 0: INFO 26-04-30 00:34:33.801460 - 8:59:14 - step: 37660 acc: 0 loss: 1.4085 grad: 1.63e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6331 data: 0.0875 lr: 1.84e-05 mem: 47% pow: 638.693 W 0: INFO 26-04-30 00:34:47.717953 - 8:59:28 - step: 37670 acc: 0 loss: 1.419 grad: 1.62e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6134 data: 0.084 lr: 1.83e-05 mem: 47% pow: 650.43 W 0: INFO 26-04-30 00:35:01.479056 - 8:59:42 - step: 37680 acc: 0 loss: 1.3884 grad: 1.63e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5892 data: 0.0882 lr: 1.83e-05 mem: 47% pow: 661.56 W 0: INFO 26-04-30 00:35:15.246565 - 8:59:56 - step: 37690 acc: 0 loss: 1.3712 grad: 1.61e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5821 data: 0.0991 lr: 1.83e-05 mem: 47% pow: 662.475 W 0: INFO 26-04-30 00:35:30.220187 - 9:00:11 - step: 37700 acc: 0 loss: 1.0763 grad: 1.71e-01 flops: 3.77e+14 wps: 4.38e+04 iter: 0.5951 data: 0.0805 lr: 1.83e-05 mem: 47% pow: 656.178 W 0: INFO 26-04-30 00:35:47.001549 - 9:00:27 - step: 37710 acc: 0 loss: 1.4681 grad: 1.55e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.7042 data: 0.1099 lr: 1.83e-05 mem: 54% pow: 583.013 W 0: INFO 26-04-30 00:36:00.734250 - 9:00:41 - step: 37720 acc: 0 loss: 1.7054 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.63 data: 0.0843 lr: 1.83e-05 mem: 47% pow: 638.496 W 0: INFO 26-04-30 00:36:14.799979 - 9:00:55 - step: 37730 acc: 0 loss: 1.4557 grad: 1.80e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6224 data: 0.0858 lr: 1.83e-05 mem: 47% pow: 643.541 W 0: INFO 26-04-30 00:36:28.543488 - 9:01:09 - step: 37740 acc: 0 loss: 1.3992 grad: 1.69e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6523 data: 0.0907 lr: 1.82e-05 mem: 47% pow: 622.233 W 0: INFO 26-04-30 00:36:42.234491 - 9:01:23 - step: 37750 acc: 0 loss: 1.1228 grad: 1.63e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5819 data: 0.0814 lr: 1.82e-05 mem: 47% pow: 668.961 W 0: INFO 26-04-30 00:36:55.898996 - 9:01:36 - step: 37760 acc: 0 loss: 1.5515 grad: 1.61e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.604 data: 0.0906 lr: 1.82e-05 mem: 47% pow: 664.22 W 0: INFO 26-04-30 00:37:09.465534 - 9:01:50 - step: 37770 acc: 0 loss: 1.4733 grad: 1.62e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6114 data: 0.0874 lr: 1.82e-05 mem: 47% pow: 660.113 W 0: INFO 26-04-30 00:37:23.075420 - 9:02:03 - step: 37780 acc: 0 loss: 1.6051 grad: 1.71e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.605 data: 0.0686 lr: 1.82e-05 mem: 47% pow: 670.503 W 0: INFO 26-04-30 00:37:36.856614 - 9:02:17 - step: 37790 acc: 0 loss: 1.2857 grad: 1.57e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5998 data: 0.087 lr: 1.82e-05 mem: 47% pow: 665.282 W 0: INFO 26-04-30 00:37:50.493624 - 9:02:31 - step: 37800 acc: 0 loss: 1.4849 grad: 1.64e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6362 data: 0.0567 lr: 1.82e-05 mem: 47% pow: 652.19 W 0: INFO 26-04-30 00:38:07.212648 - 9:02:48 - step: 37810 acc: 0 loss: 1.458 grad: 1.64e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.5913 data: 0.0816 lr: 1.81e-05 mem: 54% pow: 667.021 W 0: INFO 26-04-30 00:38:20.859722 - 9:03:01 - step: 37820 acc: 0 loss: 1.3086 grad: 1.59e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6049 data: 0.0882 lr: 1.81e-05 mem: 47% pow: 652.685 W 0: INFO 26-04-30 00:38:34.572374 - 9:03:15 - step: 37830 acc: 0 loss: 1.103 grad: 1.65e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5811 data: 0.0915 lr: 1.81e-05 mem: 47% pow: 670.019 W 0: INFO 26-04-30 00:38:48.332165 - 9:03:29 - step: 37840 acc: 0 loss: 1.4198 grad: 1.60e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.5898 data: 0.0796 lr: 1.81e-05 mem: 47% pow: 664.292 W 0: INFO 26-04-30 00:39:02.064308 - 9:03:42 - step: 37850 acc: 0 loss: 1.6591 grad: 1.61e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6015 data: 0.0806 lr: 1.81e-05 mem: 47% pow: 654.954 W 0: INFO 26-04-30 00:39:15.755706 - 9:03:56 - step: 37860 acc: 0 loss: 1.5304 grad: 1.84e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6167 data: 0.0756 lr: 1.81e-05 mem: 47% pow: 675.523 W 0: INFO 26-04-30 00:39:29.446287 - 9:04:10 - step: 37870 acc: 0 loss: 1.3847 grad: 1.71e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6087 data: 0.093 lr: 1.81e-05 mem: 47% pow: 649.676 W 0: INFO 26-04-30 00:39:43.578460 - 9:04:24 - step: 37880 acc: 0 loss: 1.3189 grad: 1.61e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.653 data: 0.0743 lr: 1.80e-05 mem: 47% pow: 635.037 W 0: INFO 26-04-30 00:39:57.699888 - 9:04:38 - step: 37890 acc: 0 loss: 1.6003 grad: 1.68e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6093 data: 0.0869 lr: 1.80e-05 mem: 47% pow: 653.791 W 0: INFO 26-04-30 00:40:11.409471 - 9:04:52 - step: 37900 acc: 0 loss: 1.5047 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6062 data: 0.0825 lr: 1.80e-05 mem: 47% pow: 661.858 W 0: INFO 26-04-30 00:40:28.313588 - 9:05:09 - step: 37910 acc: 0 loss: 1.4896 grad: 1.58e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6357 data: 0.0603 lr: 1.80e-05 mem: 54% pow: 652.84 W 0: INFO 26-04-30 00:40:41.969733 - 9:05:22 - step: 37920 acc: 0 loss: 1.1572 grad: 1.73e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6113 data: 0.0759 lr: 1.80e-05 mem: 47% pow: 663.713 W 0: INFO 26-04-30 00:40:55.913147 - 9:05:36 - step: 37930 acc: 0 loss: 1.491 grad: 1.65e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5938 data: 0.0814 lr: 1.80e-05 mem: 47% pow: 678.767 W 0: INFO 26-04-30 00:41:09.525674 - 9:05:50 - step: 37940 acc: 0 loss: 1.1321 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6388 data: 0.0776 lr: 1.79e-05 mem: 47% pow: 635.727 W 0: INFO 26-04-30 00:41:23.517141 - 9:06:04 - step: 37950 acc: 0 loss: 1.2721 grad: 1.57e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6043 data: 0.0757 lr: 1.79e-05 mem: 47% pow: 657.322 W 0: INFO 26-04-30 00:41:37.227134 - 9:06:18 - step: 37960 acc: 0 loss: 1.3575 grad: 1.58e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5943 data: 0.087 lr: 1.79e-05 mem: 47% pow: 672.137 W 0: INFO 26-04-30 00:41:50.811822 - 9:06:31 - step: 37970 acc: 0 loss: 1.7316 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6167 data: 0.0843 lr: 1.79e-05 mem: 47% pow: 649.285 W 0: INFO 26-04-30 00:42:04.473531 - 9:06:45 - step: 37980 acc: 0 loss: 1.2027 grad: 1.68e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5878 data: 0.1158 lr: 1.79e-05 mem: 47% pow: 650.785 W 0: INFO 26-04-30 00:42:18.276807 - 9:06:59 - step: 37990 acc: 0 loss: 0.9582 grad: 1.58e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6119 data: 0.1025 lr: 1.79e-05 mem: 47% pow: 635.602 W 0: INFO 26-04-30 00:42:32.228795 - 9:07:13 - step: 38000 acc: 0 loss: 1.6989 grad: 1.67e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5999 data: 0.0981 lr: 1.79e-05 mem: 47% pow: 643.772 W 0: INFO 26-04-30 00:42:35.908322 - 9:07:16 - garbage collection 0: INFO 26-04-30 00:42:50.451689 - 9:07:31 - step: 38010 acc: 0 loss: 1.4177 grad: 1.57e-01 flops: 3.10e+14 wps: 3.60e+04 iter: 0.5992 data: 0.0906 lr: 1.78e-05 mem: 54% pow: 668.284 W 0: INFO 26-04-30 00:43:04.056513 - 9:07:44 - step: 38020 acc: 0 loss: 1.2489 grad: 1.64e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6068 data: 0.087 lr: 1.78e-05 mem: 47% pow: 647.867 W 0: INFO 26-04-30 00:43:18.043178 - 9:07:58 - step: 38030 acc: 0 loss: 1.3795 grad: 1.64e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7703 data: 0.0826 lr: 1.78e-05 mem: 47% pow: 565.018 W 0: INFO 26-04-30 00:43:31.970472 - 9:08:12 - step: 38040 acc: 0 loss: 0.8956 grad: 1.69e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6211 data: 0.058 lr: 1.78e-05 mem: 47% pow: 658.198 W 0: INFO 26-04-30 00:43:45.916532 - 9:08:26 - step: 38050 acc: 0 loss: 1.388 grad: 1.65e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5891 data: 0.0845 lr: 1.78e-05 mem: 47% pow: 660.954 W 0: INFO 26-04-30 00:43:59.519368 - 9:08:40 - step: 38060 acc: 0 loss: 1.5422 grad: 1.62e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6014 data: 0.091 lr: 1.78e-05 mem: 47% pow: 658.154 W 0: INFO 26-04-30 00:44:13.732337 - 9:08:54 - step: 38070 acc: 0 loss: 1.3856 grad: 1.59e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6272 data: 0.0841 lr: 1.78e-05 mem: 47% pow: 644.652 W 0: INFO 26-04-30 00:44:27.343132 - 9:09:08 - step: 38080 acc: 0 loss: 1.4392 grad: 1.63e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5973 data: 0.0863 lr: 1.77e-05 mem: 47% pow: 662.736 W 0: INFO 26-04-30 00:44:41.185492 - 9:09:21 - step: 38090 acc: 0 loss: 1.7668 grad: 1.61e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6032 data: 0.072 lr: 1.77e-05 mem: 47% pow: 660.712 W 0: INFO 26-04-30 00:44:55.262755 - 9:09:36 - step: 38100 acc: 0 loss: 1.1614 grad: 1.55e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.675 data: 0.0665 lr: 1.77e-05 mem: 47% pow: 617.831 W 0: INFO 26-04-30 00:45:12.096441 - 9:09:52 - step: 38110 acc: 0 loss: 1.3909 grad: 1.62e-01 flops: 3.36e+14 wps: 3.89e+04 iter: 0.6045 data: 0.0891 lr: 1.77e-05 mem: 54% pow: 656.627 W 0: INFO 26-04-30 00:45:29.244102 - 9:10:10 - step: 38120 acc: 0 loss: 1.4017 grad: 1.63e-01 flops: 3.30e+14 wps: 3.83e+04 iter: 0.6195 data: 0.0702 lr: 1.77e-05 mem: 47% pow: 655.516 W 0: INFO 26-04-30 00:45:44.012912 - 9:10:24 - step: 38130 acc: 0 loss: 1.1963 grad: 1.65e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.5886 data: 0.0943 lr: 1.77e-05 mem: 47% pow: 659.129 W 0: INFO 26-04-30 00:45:57.794590 - 9:10:38 - step: 38140 acc: 0 loss: 1.1279 grad: 1.69e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.579 data: 0.1041 lr: 1.76e-05 mem: 47% pow: 678.211 W 0: INFO 26-04-30 00:46:11.590290 - 9:10:52 - step: 38150 acc: 0 loss: 1.2897 grad: 1.62e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6107 data: 0.0685 lr: 1.76e-05 mem: 47% pow: 662.765 W 0: INFO 26-04-30 00:46:25.401975 - 9:11:06 - step: 38160 acc: 0 loss: 1.5062 grad: 1.66e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5964 data: 0.0828 lr: 1.76e-05 mem: 47% pow: 660.881 W 0: INFO 26-04-30 00:46:39.071983 - 9:11:19 - step: 38170 acc: 0 loss: 1.5558 grad: 1.64e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.607 data: 0.0766 lr: 1.76e-05 mem: 47% pow: 661.421 W 0: INFO 26-04-30 00:46:52.681537 - 9:11:33 - step: 38180 acc: 0 loss: 1.6859 grad: 1.54e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6269 data: 0.0872 lr: 1.76e-05 mem: 47% pow: 634.341 W 0: INFO 26-04-30 00:47:06.230067 - 9:11:47 - step: 38190 acc: 0 loss: 1.3323 grad: 1.55e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5984 data: 0.0999 lr: 1.76e-05 mem: 47% pow: 653.063 W 0: INFO 26-04-30 00:47:20.070383 - 9:12:00 - step: 38200 acc: 0 loss: 1.6282 grad: 1.60e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6292 data: 0.0599 lr: 1.76e-05 mem: 47% pow: 653.704 W 0: INFO 26-04-30 00:47:36.723072 - 9:12:17 - step: 38210 acc: 0 loss: 1.3847 grad: 1.76e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6009 data: 0.0751 lr: 1.75e-05 mem: 54% pow: 663.736 W 0: INFO 26-04-30 00:47:50.662652 - 9:12:31 - step: 38220 acc: 0 loss: 1.2596 grad: 1.63e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.6941 data: 0.0942 lr: 1.75e-05 mem: 47% pow: 611.63 W 0: INFO 26-04-30 00:48:04.326791 - 9:12:45 - step: 38230 acc: 0 loss: 0.8701 grad: 1.62e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5934 data: 0.0874 lr: 1.75e-05 mem: 47% pow: 656.75 W 0: INFO 26-04-30 00:48:18.240271 - 9:12:59 - step: 38240 acc: 0 loss: 1.294 grad: 1.67e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6298 data: 0.0843 lr: 1.75e-05 mem: 47% pow: 640.614 W 0: INFO 26-04-30 00:48:31.767177 - 9:13:12 - step: 38250 acc: 0 loss: 1.3871 grad: 1.66e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6056 data: 0.0783 lr: 1.75e-05 mem: 47% pow: 667.209 W 0: INFO 26-04-30 00:48:45.871300 - 9:13:26 - step: 38260 acc: 0 loss: 1.6339 grad: 1.64e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6279 data: 0.0708 lr: 1.75e-05 mem: 47% pow: 649.438 W 0: INFO 26-04-30 00:48:59.380354 - 9:13:40 - step: 38270 acc: 0 loss: 1.2232 grad: 1.57e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5888 data: 0.0887 lr: 1.75e-05 mem: 47% pow: 660.084 W 0: INFO 26-04-30 00:49:13.163779 - 9:13:53 - step: 38280 acc: 0 loss: 1.4233 grad: 1.63e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6065 data: 0.0835 lr: 1.74e-05 mem: 47% pow: 670.572 W 0: INFO 26-04-30 00:49:26.977395 - 9:14:07 - step: 38290 acc: 0 loss: 1.2795 grad: 1.63e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.603 data: 0.0881 lr: 1.74e-05 mem: 47% pow: 666.456 W 0: INFO 26-04-30 00:49:40.677606 - 9:14:21 - step: 38300 acc: 0 loss: 1.3404 grad: 1.62e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.654 data: 0.078 lr: 1.74e-05 mem: 47% pow: 635.963 W 0: INFO 26-04-30 00:49:57.317494 - 9:14:38 - step: 38310 acc: 0 loss: 1.4379 grad: 1.59e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.5956 data: 0.0886 lr: 1.74e-05 mem: 54% pow: 657.803 W 0: INFO 26-04-30 00:50:11.014197 - 9:14:51 - step: 38320 acc: 0 loss: 1.0504 grad: 1.54e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6167 data: 0.0936 lr: 1.74e-05 mem: 47% pow: 649.256 W 0: INFO 26-04-30 00:50:24.868979 - 9:15:05 - step: 38330 acc: 0 loss: 1.4126 grad: 1.61e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6088 data: 0.0856 lr: 1.74e-05 mem: 47% pow: 650.718 W 0: INFO 26-04-30 00:50:38.912353 - 9:15:19 - step: 38340 acc: 0 loss: 1.1759 grad: 1.67e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6537 data: 0.093 lr: 1.74e-05 mem: 47% pow: 620.045 W 0: INFO 26-04-30 00:50:52.468940 - 9:15:33 - step: 38350 acc: 0 loss: 1.4525 grad: 1.64e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5842 data: 0.0892 lr: 1.73e-05 mem: 47% pow: 664.568 W 0: INFO 26-04-30 00:51:06.293781 - 9:15:47 - step: 38360 acc: 0 loss: 1.3038 grad: 1.63e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6186 data: 0.0889 lr: 1.73e-05 mem: 47% pow: 650.607 W 0: INFO 26-04-30 00:51:19.994569 - 9:16:00 - step: 38370 acc: 0 loss: 1.3159 grad: 1.65e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5998 data: 0.0878 lr: 1.73e-05 mem: 47% pow: 671.035 W 0: INFO 26-04-30 00:51:33.699732 - 9:16:14 - step: 38380 acc: 0 loss: 1.4248 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5756 data: 0.0997 lr: 1.73e-05 mem: 47% pow: 665.598 W 0: INFO 26-04-30 00:51:47.281526 - 9:16:28 - step: 38390 acc: 0 loss: 1.1444 grad: 1.61e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6088 data: 0.0823 lr: 1.73e-05 mem: 47% pow: 655.094 W 0: INFO 26-04-30 00:52:01.025826 - 9:16:41 - step: 38400 acc: 0 loss: 1.2279 grad: 1.66e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6152 data: 0.0681 lr: 1.73e-05 mem: 47% pow: 687.411 W 0: INFO 26-04-30 00:52:17.689142 - 9:16:58 - step: 38410 acc: 0 loss: 1.3581 grad: 1.69e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5906 data: 0.0898 lr: 1.72e-05 mem: 54% pow: 666.51 W 0: INFO 26-04-30 00:52:31.295048 - 9:17:12 - step: 38420 acc: 0 loss: 1.5312 grad: 1.60e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6027 data: 0.0923 lr: 1.72e-05 mem: 47% pow: 653.114 W 0: INFO 26-04-30 00:52:45.045098 - 9:17:25 - step: 38430 acc: 0 loss: 1.338 grad: 1.72e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5944 data: 0.0835 lr: 1.72e-05 mem: 47% pow: 661.698 W 0: INFO 26-04-30 00:52:58.511767 - 9:17:39 - step: 38440 acc: 0 loss: 1.4543 grad: 1.62e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5831 data: 0.1285 lr: 1.72e-05 mem: 47% pow: 638.804 W 0: INFO 26-04-30 00:53:12.301540 - 9:17:53 - step: 38450 acc: 0 loss: 1.2171 grad: 1.72e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6134 data: 0.0792 lr: 1.72e-05 mem: 47% pow: 650.914 W 0: INFO 26-04-30 00:53:25.868282 - 9:18:06 - step: 38460 acc: 0 loss: 1.147 grad: 1.65e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5848 data: 0.0871 lr: 1.72e-05 mem: 47% pow: 668.635 W 0: INFO 26-04-30 00:53:39.735397 - 9:18:20 - step: 38470 acc: 0 loss: 1.5643 grad: 1.69e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6096 data: 0.0748 lr: 1.72e-05 mem: 47% pow: 661.843 W 0: INFO 26-04-30 00:53:53.278488 - 9:18:34 - step: 38480 acc: 0 loss: 1.4692 grad: 1.62e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5964 data: 0.0881 lr: 1.71e-05 mem: 47% pow: 664.3 W 0: INFO 26-04-30 00:54:06.872776 - 9:18:47 - step: 38490 acc: 0 loss: 1.2548 grad: 1.61e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5876 data: 0.0902 lr: 1.71e-05 mem: 47% pow: 667.332 W 0: INFO 26-04-30 00:54:20.506540 - 9:19:01 - step: 38500 acc: 0 loss: 1.4484 grad: 1.66e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5824 data: 0.0938 lr: 1.71e-05 mem: 47% pow: 653.315 W 0: INFO 26-04-30 00:54:37.046352 - 9:19:17 - step: 38510 acc: 0 loss: 1.289 grad: 1.54e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6079 data: 0.0781 lr: 1.71e-05 mem: 54% pow: 662.478 W 0: INFO 26-04-30 00:54:50.728406 - 9:19:31 - step: 38520 acc: 0 loss: 1.1147 grad: 1.57e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5928 data: 0.0817 lr: 1.71e-05 mem: 47% pow: 660.685 W 0: INFO 26-04-30 00:55:04.442570 - 9:19:45 - step: 38530 acc: 0 loss: 1.3425 grad: 1.63e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6052 data: 0.091 lr: 1.71e-05 mem: 47% pow: 670.306 W 0: INFO 26-04-30 00:55:18.492321 - 9:19:59 - step: 38540 acc: 0 loss: 1.0462 grad: 1.73e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6293 data: 0.0909 lr: 1.71e-05 mem: 47% pow: 642.595 W 0: INFO 26-04-30 00:55:32.297068 - 9:20:13 - step: 38550 acc: 0 loss: 1.4722 grad: 1.77e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6469 data: 0.0798 lr: 1.70e-05 mem: 47% pow: 635.818 W 0: INFO 26-04-30 00:55:46.053848 - 9:20:26 - step: 38560 acc: 0 loss: 1.5083 grad: 1.61e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6136 data: 0.0782 lr: 1.70e-05 mem: 47% pow: 663.232 W 0: INFO 26-04-30 00:56:00.180602 - 9:20:40 - step: 38570 acc: 0 loss: 1.3295 grad: 1.54e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5849 data: 0.083 lr: 1.70e-05 mem: 47% pow: 669.826 W 0: INFO 26-04-30 00:56:13.930401 - 9:20:54 - step: 38580 acc: 0 loss: 1.1213 grad: 1.62e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6419 data: 0.0917 lr: 1.70e-05 mem: 47% pow: 632.051 W 0: INFO 26-04-30 00:56:27.669842 - 9:21:08 - step: 38590 acc: 0 loss: 1.1088 grad: 1.73e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6122 data: 0.0853 lr: 1.70e-05 mem: 47% pow: 644.427 W 0: INFO 26-04-30 00:56:41.493502 - 9:21:22 - step: 38600 acc: 0 loss: 1.5456 grad: 1.52e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.7186 data: 0.0933 lr: 1.70e-05 mem: 47% pow: 592.058 W 0: INFO 26-04-30 00:56:58.366086 - 9:21:39 - step: 38610 acc: 0 loss: 1.2835 grad: 1.56e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.5891 data: 0.1231 lr: 1.69e-05 mem: 54% pow: 642.195 W 0: INFO 26-04-30 00:57:11.958257 - 9:21:52 - step: 38620 acc: 0 loss: 1.4999 grad: 1.64e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.625 data: 0.0911 lr: 1.69e-05 mem: 47% pow: 641.141 W 0: INFO 26-04-30 00:57:25.972774 - 9:22:06 - step: 38630 acc: 0 loss: 1.4303 grad: 1.76e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5784 data: 0.108 lr: 1.69e-05 mem: 47% pow: 664.978 W 0: INFO 26-04-30 00:57:40.206686 - 9:22:21 - step: 38640 acc: 0 loss: 1.3253 grad: 1.63e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6145 data: 0.079 lr: 1.69e-05 mem: 47% pow: 660.778 W 0: INFO 26-04-30 00:57:53.799984 - 9:22:34 - step: 38650 acc: 0 loss: 1.5867 grad: 1.67e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.594 data: 0.0912 lr: 1.69e-05 mem: 47% pow: 664.856 W 0: INFO 26-04-30 00:58:07.354247 - 9:22:48 - step: 38660 acc: 0 loss: 1.0662 grad: 1.74e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5763 data: 0.0999 lr: 1.69e-05 mem: 47% pow: 660.867 W 0: INFO 26-04-30 00:58:21.298181 - 9:23:02 - step: 38670 acc: 0 loss: 1.303 grad: 1.72e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.591 data: 0.0884 lr: 1.69e-05 mem: 47% pow: 657.176 W 0: INFO 26-04-30 00:58:35.591483 - 9:23:16 - step: 38680 acc: 0 loss: 1.425 grad: 1.54e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.6667 data: 0.0903 lr: 1.68e-05 mem: 47% pow: 615.137 W 0: INFO 26-04-30 00:58:49.223944 - 9:23:30 - step: 38690 acc: 0 loss: 1.319 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6088 data: 0.0761 lr: 1.68e-05 mem: 47% pow: 660.501 W 0: INFO 26-04-30 00:59:02.921443 - 9:23:43 - step: 38700 acc: 0 loss: 1.464 grad: 1.65e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.591 data: 0.0829 lr: 1.68e-05 mem: 47% pow: 665.456 W 0: INFO 26-04-30 00:59:19.462650 - 9:24:00 - step: 38710 acc: 0 loss: 1.3154 grad: 1.72e-01 flops: 3.42e+14 wps: 3.96e+04 iter: 0.6483 data: 0.096 lr: 1.68e-05 mem: 54% pow: 621.752 W 0: INFO 26-04-30 00:59:33.169750 - 9:24:13 - step: 38720 acc: 0 loss: 1.3802 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5889 data: 0.0847 lr: 1.68e-05 mem: 47% pow: 668.357 W 0: INFO 26-04-30 00:59:46.972186 - 9:24:27 - step: 38730 acc: 0 loss: 1.2165 grad: 1.58e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.7038 data: 0.0861 lr: 1.68e-05 mem: 47% pow: 595.746 W 0: INFO 26-04-30 01:00:00.927484 - 9:24:41 - step: 38740 acc: 0 loss: 1.4161 grad: 1.58e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.642 data: 0.0878 lr: 1.68e-05 mem: 47% pow: 629.765 W 0: INFO 26-04-30 01:00:14.765553 - 9:24:55 - step: 38750 acc: 0 loss: 1.0363 grad: 1.56e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6286 data: 0.0789 lr: 1.67e-05 mem: 47% pow: 653.4 W 0: INFO 26-04-30 01:00:28.673634 - 9:25:09 - step: 38760 acc: 0 loss: 1.2272 grad: 1.62e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.5815 data: 0.1064 lr: 1.67e-05 mem: 47% pow: 666.479 W 0: INFO 26-04-30 01:00:42.420779 - 9:25:23 - step: 38770 acc: 0 loss: 1.2643 grad: 1.52e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5986 data: 0.0843 lr: 1.67e-05 mem: 47% pow: 678.208 W 0: INFO 26-04-30 01:00:56.186016 - 9:25:36 - step: 38780 acc: 0 loss: 1.0841 grad: 1.53e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.5963 data: 0.0864 lr: 1.67e-05 mem: 47% pow: 663.425 W 0: INFO 26-04-30 01:01:09.843445 - 9:25:50 - step: 38790 acc: 0 loss: 1.1795 grad: 1.55e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5973 data: 0.0868 lr: 1.67e-05 mem: 47% pow: 660.194 W 0: INFO 26-04-30 01:01:23.610390 - 9:26:04 - step: 38800 acc: 0 loss: 1.1648 grad: 1.53e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6075 data: 0.0803 lr: 1.67e-05 mem: 47% pow: 662.464 W 0: INFO 26-04-30 01:01:40.435701 - 9:26:21 - step: 38810 acc: 0 loss: 1.4067 grad: 1.54e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.5985 data: 0.0881 lr: 1.67e-05 mem: 54% pow: 679.847 W 0: INFO 26-04-30 01:01:53.947020 - 9:26:34 - step: 38820 acc: 0 loss: 1.2878 grad: 1.62e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6143 data: 0.09 lr: 1.66e-05 mem: 47% pow: 644.691 W 0: INFO 26-04-30 01:02:07.712921 - 9:26:48 - step: 38830 acc: 0 loss: 1.2219 grad: 1.63e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6025 data: 0.0873 lr: 1.66e-05 mem: 47% pow: 659.232 W 0: INFO 26-04-30 01:02:21.280698 - 9:27:02 - step: 38840 acc: 0 loss: 1.3875 grad: 1.62e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5971 data: 0.087 lr: 1.66e-05 mem: 47% pow: 666.942 W 0: INFO 26-04-30 01:02:35.256504 - 9:27:16 - step: 38850 acc: 0 loss: 1.421 grad: 1.63e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6598 data: 0.0781 lr: 1.66e-05 mem: 47% pow: 623.805 W 0: INFO 26-04-30 01:02:48.782012 - 9:27:29 - step: 38860 acc: 0 loss: 1.3439 grad: 1.71e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6224 data: 0.084 lr: 1.66e-05 mem: 47% pow: 654.317 W 0: INFO 26-04-30 01:03:02.381588 - 9:27:43 - step: 38870 acc: 0 loss: 1.3908 grad: 1.70e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5895 data: 0.0901 lr: 1.66e-05 mem: 47% pow: 658.818 W 0: INFO 26-04-30 01:03:16.222551 - 9:27:57 - step: 38880 acc: 0 loss: 1.4563 grad: 1.57e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6022 data: 0.0815 lr: 1.65e-05 mem: 47% pow: 680.349 W 0: INFO 26-04-30 01:03:29.918779 - 9:28:10 - step: 38890 acc: 0 loss: 1.0356 grad: 1.54e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6116 data: 0.0838 lr: 1.65e-05 mem: 47% pow: 645.306 W 0: INFO 26-04-30 01:03:43.671846 - 9:28:24 - step: 38900 acc: 0 loss: 1.5247 grad: 1.60e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6046 data: 0.0897 lr: 1.65e-05 mem: 47% pow: 655.462 W 0: INFO 26-04-30 01:04:00.266617 - 9:28:41 - step: 38910 acc: 0 loss: 1.0191 grad: 1.63e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6035 data: 0.0858 lr: 1.65e-05 mem: 54% pow: 667.688 W 0: INFO 26-04-30 01:04:14.453786 - 9:28:55 - step: 38920 acc: 0 loss: 1.0647 grad: 1.52e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5805 data: 0.128 lr: 1.65e-05 mem: 47% pow: 646.328 W 0: INFO 26-04-30 01:04:28.429390 - 9:29:09 - step: 38930 acc: 0 loss: 1.5178 grad: 1.52e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.738 data: 0.0032 lr: 1.65e-05 mem: 47% pow: 646.054 W 0: INFO 26-04-30 01:04:42.636419 - 9:29:23 - step: 38940 acc: 0 loss: 1.2448 grad: 1.55e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6033 data: 0.0866 lr: 1.65e-05 mem: 47% pow: 660.198 W 0: INFO 26-04-30 01:04:56.564729 - 9:29:37 - step: 38950 acc: 0 loss: 1.3228 grad: 1.57e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5948 data: 0.0901 lr: 1.64e-05 mem: 47% pow: 667.353 W 0: INFO 26-04-30 01:05:10.222639 - 9:29:51 - step: 38960 acc: 0 loss: 1.0229 grad: 1.57e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5954 data: 0.0926 lr: 1.64e-05 mem: 47% pow: 658.386 W 0: INFO 26-04-30 01:05:23.851552 - 9:30:04 - step: 38970 acc: 0 loss: 1.0083 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5961 data: 0.0902 lr: 1.64e-05 mem: 47% pow: 671.972 W 0: INFO 26-04-30 01:05:37.483001 - 9:30:18 - step: 38980 acc: 0 loss: 1.5298 grad: 1.75e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6089 data: 0.0844 lr: 1.64e-05 mem: 47% pow: 653.478 W 0: INFO 26-04-30 01:05:51.019758 - 9:30:31 - step: 38990 acc: 0 loss: 1.0778 grad: 1.58e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6047 data: 0.0881 lr: 1.64e-05 mem: 47% pow: 656.565 W 0: INFO 26-04-30 01:06:04.614719 - 9:30:45 - step: 39000 acc: 0 loss: 1.2263 grad: 1.59e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5809 data: 0.0922 lr: 1.64e-05 mem: 47% pow: 670.153 W 0: INFO 26-04-30 01:06:08.277128 - 9:30:49 - garbage collection 0: INFO 26-04-30 01:06:22.777682 - 9:31:03 - step: 39010 acc: 0 loss: 1.2312 grad: 1.61e-01 flops: 3.11e+14 wps: 3.61e+04 iter: 0.6057 data: 0.0855 lr: 1.64e-05 mem: 54% pow: 664.172 W 0: INFO 26-04-30 01:06:36.429719 - 9:31:17 - step: 39020 acc: 0 loss: 1.3386 grad: 1.56e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5926 data: 0.0881 lr: 1.63e-05 mem: 47% pow: 658.28 W 0: INFO 26-04-30 01:06:50.238020 - 9:31:31 - step: 39030 acc: 0 loss: 1.2952 grad: 1.49e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6047 data: 0.0861 lr: 1.63e-05 mem: 47% pow: 667.455 W 0: INFO 26-04-30 01:07:03.870062 - 9:31:44 - step: 39040 acc: 0 loss: 1.0596 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6069 data: 0.0825 lr: 1.63e-05 mem: 47% pow: 656.857 W 0: INFO 26-04-30 01:07:17.470743 - 9:31:58 - step: 39050 acc: 0 loss: 1.3254 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5819 data: 0.1319 lr: 1.63e-05 mem: 47% pow: 634.985 W 0: INFO 26-04-30 01:07:31.094244 - 9:32:11 - step: 39060 acc: 0 loss: 1.2589 grad: 1.57e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6011 data: 0.0872 lr: 1.63e-05 mem: 47% pow: 661.16 W 0: INFO 26-04-30 01:07:45.016859 - 9:32:25 - step: 39070 acc: 0 loss: 1.3269 grad: 1.60e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5971 data: 0.0942 lr: 1.63e-05 mem: 47% pow: 663.239 W 0: INFO 26-04-30 01:07:58.613157 - 9:32:39 - step: 39080 acc: 0 loss: 0.9995 grad: 1.70e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6321 data: 0.1207 lr: 1.63e-05 mem: 47% pow: 611.83 W 0: INFO 26-04-30 01:08:12.178313 - 9:32:52 - step: 39090 acc: 0 loss: 1.1997 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6004 data: 0.0877 lr: 1.62e-05 mem: 47% pow: 652.79 W 0: INFO 26-04-30 01:08:26.073423 - 9:33:06 - step: 39100 acc: 0 loss: 1.47 grad: 1.59e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6168 data: 0.0757 lr: 1.62e-05 mem: 47% pow: 649.392 W 0: INFO 26-04-30 01:08:42.858870 - 9:33:23 - step: 39110 acc: 0 loss: 1.137 grad: 1.64e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6809 data: 0.09 lr: 1.62e-05 mem: 54% pow: 610.71 W 0: INFO 26-04-30 01:08:56.641706 - 9:33:37 - step: 39120 acc: 0 loss: 1.5731 grad: 1.58e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5883 data: 0.0895 lr: 1.62e-05 mem: 47% pow: 665.403 W 0: INFO 26-04-30 01:09:10.271044 - 9:33:51 - step: 39130 acc: 0 loss: 1.2136 grad: 1.81e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5967 data: 0.0885 lr: 1.62e-05 mem: 47% pow: 663.177 W 0: INFO 26-04-30 01:09:24.134440 - 9:34:04 - step: 39140 acc: 0 loss: 1.1483 grad: 1.58e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6341 data: 0.0887 lr: 1.62e-05 mem: 47% pow: 656.199 W 0: INFO 26-04-30 01:09:37.776729 - 9:34:18 - step: 39150 acc: 0 loss: 1.516 grad: 1.61e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6022 data: 0.0919 lr: 1.61e-05 mem: 47% pow: 654.632 W 0: INFO 26-04-30 01:09:51.784653 - 9:34:32 - step: 39160 acc: 0 loss: 1.2986 grad: 1.67e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5855 data: 0.105 lr: 1.61e-05 mem: 47% pow: 648.96 W 0: INFO 26-04-30 01:10:05.394066 - 9:34:46 - step: 39170 acc: 0 loss: 1.4176 grad: 1.58e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6015 data: 0.091 lr: 1.61e-05 mem: 47% pow: 664.012 W 0: INFO 26-04-30 01:10:18.837370 - 9:34:59 - step: 39180 acc: 0 loss: 2.14 grad: 1.50e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5997 data: 0.0904 lr: 1.61e-05 mem: 47% pow: 656.164 W 0: INFO 26-04-30 01:10:32.606118 - 9:35:13 - step: 39190 acc: 0 loss: 1.4976 grad: 1.53e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6008 data: 0.0783 lr: 1.61e-05 mem: 47% pow: 660.156 W 0: INFO 26-04-30 01:10:46.286325 - 9:35:27 - step: 39200 acc: 0 loss: 0.9325 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5815 data: 0.0939 lr: 1.61e-05 mem: 47% pow: 660.779 W 0: INFO 26-04-30 01:11:02.820348 - 9:35:43 - step: 39210 acc: 0 loss: 1.3246 grad: 1.64e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.5897 data: 0.0836 lr: 1.61e-05 mem: 54% pow: 660.954 W 0: INFO 26-04-30 01:11:16.685494 - 9:35:57 - step: 39220 acc: 0 loss: 0.957 grad: 1.58e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.707 data: 0.0857 lr: 1.60e-05 mem: 47% pow: 594.01 W 0: INFO 26-04-30 01:11:30.463005 - 9:36:11 - step: 39230 acc: 0 loss: 1.4263 grad: 1.53e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.629 data: 0.0854 lr: 1.60e-05 mem: 47% pow: 637.42 W 0: INFO 26-04-30 01:11:44.953786 - 9:36:25 - step: 39240 acc: 0 loss: 1.2323 grad: 1.53e-01 flops: 3.90e+14 wps: 4.52e+04 iter: 0.6042 data: 0.0864 lr: 1.60e-05 mem: 47% pow: 655.482 W 0: INFO 26-04-30 01:11:58.782299 - 9:36:39 - step: 39250 acc: 0 loss: 1.3076 grad: 1.77e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.636 data: 0.0763 lr: 1.60e-05 mem: 47% pow: 640.451 W 0: INFO 26-04-30 01:12:12.748843 - 9:36:53 - step: 39260 acc: 0 loss: 1.428 grad: 1.56e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6398 data: 0.0863 lr: 1.60e-05 mem: 47% pow: 636.7 W 0: INFO 26-04-30 01:12:26.344771 - 9:37:07 - step: 39270 acc: 0 loss: 1.0747 grad: 2.02e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5788 data: 0.0966 lr: 1.60e-05 mem: 47% pow: 665.709 W 0: INFO 26-04-30 01:12:40.224077 - 9:37:21 - step: 39280 acc: 0 loss: 1.2252 grad: 1.61e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6033 data: 0.0935 lr: 1.60e-05 mem: 47% pow: 648.935 W 0: INFO 26-04-30 01:12:53.871728 - 9:37:34 - step: 39290 acc: 0 loss: 1.6198 grad: 1.52e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5972 data: 0.0857 lr: 1.59e-05 mem: 47% pow: 672.995 W 0: INFO 26-04-30 01:13:07.505388 - 9:37:48 - step: 39300 acc: 0 loss: 1.192 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5768 data: 0.1005 lr: 1.59e-05 mem: 47% pow: 661.422 W 0: INFO 26-04-30 01:13:24.357936 - 9:38:05 - step: 39310 acc: 0 loss: 1.1103 grad: 1.56e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.596 data: 0.0756 lr: 1.59e-05 mem: 54% pow: 677.497 W 0: INFO 26-04-30 01:13:38.347326 - 9:38:19 - step: 39320 acc: 0 loss: 1.4387 grad: 1.78e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5934 data: 0.0944 lr: 1.59e-05 mem: 47% pow: 666.738 W 0: INFO 26-04-30 01:13:52.319396 - 9:38:33 - step: 39330 acc: 0 loss: 1.4132 grad: 1.58e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.629 data: 0.0859 lr: 1.59e-05 mem: 47% pow: 631.523 W 0: INFO 26-04-30 01:14:06.444955 - 9:38:47 - step: 39340 acc: 0 loss: 1.3412 grad: 1.58e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6405 data: 0.0564 lr: 1.59e-05 mem: 47% pow: 647.314 W 0: INFO 26-04-30 01:14:20.038268 - 9:39:00 - step: 39350 acc: 0 loss: 1.4132 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6142 data: 0.0813 lr: 1.58e-05 mem: 47% pow: 656.69 W 0: INFO 26-04-30 01:14:33.938151 - 9:39:14 - step: 39360 acc: 0 loss: 1.553 grad: 1.55e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.8682 data: 0.083 lr: 1.58e-05 mem: 47% pow: 512.122 W 0: INFO 26-04-30 01:14:47.621669 - 9:39:28 - step: 39370 acc: 0 loss: 1.2869 grad: 1.51e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6394 data: 0.0941 lr: 1.58e-05 mem: 47% pow: 630.955 W 0: INFO 26-04-30 01:15:01.620515 - 9:39:42 - step: 39380 acc: 0 loss: 1.2162 grad: 1.56e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6022 data: 0.1037 lr: 1.58e-05 mem: 47% pow: 653.359 W 0: INFO 26-04-30 01:15:15.195195 - 9:39:55 - step: 39390 acc: 0 loss: 1.2018 grad: 1.70e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5966 data: 0.089 lr: 1.58e-05 mem: 47% pow: 661.71 W 0: INFO 26-04-30 01:15:28.950254 - 9:40:09 - step: 39400 acc: 0 loss: 1.5059 grad: 1.54e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5811 data: 0.1222 lr: 1.58e-05 mem: 47% pow: 654.525 W 0: INFO 26-04-30 01:15:45.572647 - 9:40:26 - step: 39410 acc: 0 loss: 1.1968 grad: 1.58e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.609 data: 0.086 lr: 1.58e-05 mem: 54% pow: 652.986 W 0: INFO 26-04-30 01:15:59.193272 - 9:40:39 - step: 39420 acc: 0 loss: 1.2954 grad: 1.55e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6014 data: 0.0847 lr: 1.57e-05 mem: 47% pow: 666.361 W 0: INFO 26-04-30 01:16:13.294467 - 9:40:54 - step: 39430 acc: 0 loss: 1.4241 grad: 1.57e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6006 data: 0.0877 lr: 1.57e-05 mem: 47% pow: 665.062 W 0: INFO 26-04-30 01:16:27.176776 - 9:41:07 - step: 39440 acc: 0 loss: 1.2085 grad: 1.49e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5991 data: 0.074 lr: 1.57e-05 mem: 47% pow: 667.335 W 0: INFO 26-04-30 01:16:40.943217 - 9:41:21 - step: 39450 acc: 0 loss: 1.2949 grad: 1.64e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6149 data: 0.0582 lr: 1.57e-05 mem: 47% pow: 664.284 W 0: INFO 26-04-30 01:16:54.497686 - 9:41:35 - step: 39460 acc: 0 loss: 1.3313 grad: 1.63e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5793 data: 0.1108 lr: 1.57e-05 mem: 47% pow: 659.901 W 0: INFO 26-04-30 01:17:08.153421 - 9:41:48 - step: 39470 acc: 0 loss: 1.2486 grad: 1.55e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.7899 data: 0.0754 lr: 1.57e-05 mem: 47% pow: 561.162 W 0: INFO 26-04-30 01:17:21.926262 - 9:42:02 - step: 39480 acc: 0 loss: 1.2222 grad: 1.59e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6067 data: 0.0896 lr: 1.57e-05 mem: 47% pow: 656.546 W 0: INFO 26-04-30 01:17:35.526156 - 9:42:16 - step: 39490 acc: 0 loss: 1.2459 grad: 1.59e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.615 data: 0.0776 lr: 1.56e-05 mem: 47% pow: 660.455 W 0: INFO 26-04-30 01:17:49.209553 - 9:42:30 - step: 39500 acc: 0 loss: 1.1228 grad: 1.50e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.644 data: 0.0921 lr: 1.56e-05 mem: 47% pow: 633.184 W 0: INFO 26-04-30 01:18:06.071890 - 9:42:46 - step: 39510 acc: 0 loss: 1.1993 grad: 1.57e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.601 data: 0.0854 lr: 1.56e-05 mem: 54% pow: 662.034 W 0: INFO 26-04-30 01:18:19.831926 - 9:43:00 - step: 39520 acc: 0 loss: 1.4475 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6026 data: 0.0932 lr: 1.56e-05 mem: 47% pow: 652.289 W 0: INFO 26-04-30 01:18:33.489212 - 9:43:14 - step: 39530 acc: 0 loss: 1.1057 grad: 1.65e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6316 data: 0.07 lr: 1.56e-05 mem: 47% pow: 659.693 W 0: INFO 26-04-30 01:18:47.037055 - 9:43:27 - step: 39540 acc: 0 loss: 1.2538 grad: 1.55e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6839 data: 0.0845 lr: 1.56e-05 mem: 47% pow: 617.55 W 0: INFO 26-04-30 01:19:00.726061 - 9:43:41 - step: 39550 acc: 0 loss: 1.1702 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.591 data: 0.09 lr: 1.56e-05 mem: 47% pow: 660.192 W 0: INFO 26-04-30 01:19:14.682211 - 9:43:55 - step: 39560 acc: 0 loss: 1.2652 grad: 1.58e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6226 data: 0.0875 lr: 1.55e-05 mem: 47% pow: 637.394 W 0: INFO 26-04-30 01:19:28.316137 - 9:44:09 - step: 39570 acc: 0 loss: 1.4169 grad: 1.61e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5925 data: 0.0877 lr: 1.55e-05 mem: 47% pow: 654.46 W 0: INFO 26-04-30 01:19:42.281564 - 9:44:23 - step: 39580 acc: 0 loss: 1.0848 grad: 1.70e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6139 data: 0.0925 lr: 1.55e-05 mem: 47% pow: 655.898 W 0: INFO 26-04-30 01:19:55.927993 - 9:44:36 - step: 39590 acc: 0 loss: 1.3686 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5876 data: 0.0866 lr: 1.55e-05 mem: 47% pow: 670.715 W 0: INFO 26-04-30 01:20:09.797762 - 9:44:50 - step: 39600 acc: 0 loss: 1.0637 grad: 1.54e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6042 data: 0.0859 lr: 1.55e-05 mem: 47% pow: 657.573 W 0: INFO 26-04-30 01:20:26.734364 - 9:45:07 - step: 39610 acc: 0 loss: 1.1802 grad: 1.53e-01 flops: 3.33e+14 wps: 3.87e+04 iter: 0.6571 data: 0.0895 lr: 1.55e-05 mem: 54% pow: 626.345 W 0: INFO 26-04-30 01:20:40.760736 - 9:45:21 - step: 39620 acc: 0 loss: 1.1948 grad: 1.48e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.627 data: 0.0865 lr: 1.54e-05 mem: 47% pow: 633.632 W 0: INFO 26-04-30 01:20:54.384236 - 9:45:35 - step: 39630 acc: 0 loss: 1.412 grad: 1.63e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.591 data: 0.0969 lr: 1.54e-05 mem: 47% pow: 668.629 W 0: INFO 26-04-30 01:21:08.057214 - 9:45:48 - step: 39640 acc: 0 loss: 1.2547 grad: 1.69e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6196 data: 0.0908 lr: 1.54e-05 mem: 47% pow: 637.359 W 0: INFO 26-04-30 01:21:21.764332 - 9:46:02 - step: 39650 acc: 0 loss: 1.3209 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5838 data: 0.0869 lr: 1.54e-05 mem: 47% pow: 663.943 W 0: INFO 26-04-30 01:21:35.481714 - 9:46:16 - step: 39660 acc: 0 loss: 1.2406 grad: 1.56e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5788 data: 0.094 lr: 1.54e-05 mem: 47% pow: 660.337 W 0: INFO 26-04-30 01:21:49.516255 - 9:46:30 - step: 39670 acc: 0 loss: 1.1404 grad: 1.63e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6282 data: 0.0831 lr: 1.54e-05 mem: 47% pow: 653.852 W 0: INFO 26-04-30 01:22:03.199911 - 9:46:43 - step: 39680 acc: 0 loss: 1.0885 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6215 data: 0.0793 lr: 1.54e-05 mem: 47% pow: 673.652 W 0: INFO 26-04-30 01:22:17.002139 - 9:46:57 - step: 39690 acc: 0 loss: 1.4071 grad: 1.58e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6051 data: 0.088 lr: 1.53e-05 mem: 47% pow: 655.36 W 0: INFO 26-04-30 01:22:30.623750 - 9:47:11 - step: 39700 acc: 0 loss: 1.2933 grad: 1.44e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6906 data: 0.0632 lr: 1.53e-05 mem: 47% pow: 619.613 W 0: INFO 26-04-30 01:22:47.071633 - 9:47:27 - step: 39710 acc: 0 loss: 1.2007 grad: 1.60e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.5877 data: 0.0813 lr: 1.53e-05 mem: 54% pow: 669.001 W 0: INFO 26-04-30 01:23:00.960878 - 9:47:41 - step: 39720 acc: 0 loss: 1.2401 grad: 1.63e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6429 data: 0.0694 lr: 1.53e-05 mem: 47% pow: 641.559 W 0: INFO 26-04-30 01:23:15.227025 - 9:47:56 - step: 39730 acc: 0 loss: 1.3691 grad: 1.51e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.5932 data: 0.0887 lr: 1.53e-05 mem: 47% pow: 673.504 W 0: INFO 26-04-30 01:23:28.974064 - 9:48:09 - step: 39740 acc: 0 loss: 1.2948 grad: 1.58e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6186 data: 0.0684 lr: 1.53e-05 mem: 47% pow: 662.266 W 0: INFO 26-04-30 01:23:42.582990 - 9:48:23 - step: 39750 acc: 0 loss: 1.2264 grad: 1.54e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6184 data: 0.0888 lr: 1.53e-05 mem: 47% pow: 648.547 W 0: INFO 26-04-30 01:23:56.737439 - 9:48:37 - step: 39760 acc: 0 loss: 1.1026 grad: 1.52e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6143 data: 0.0912 lr: 1.52e-05 mem: 47% pow: 647.531 W 0: INFO 26-04-30 01:24:10.535933 - 9:48:51 - step: 39770 acc: 0 loss: 1.7206 grad: 1.74e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.614 data: 0.0844 lr: 1.52e-05 mem: 47% pow: 651.136 W 0: INFO 26-04-30 01:24:24.363671 - 9:49:05 - step: 39780 acc: 0 loss: 1.3681 grad: 1.53e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6052 data: 0.0858 lr: 1.52e-05 mem: 47% pow: 655.345 W 0: INFO 26-04-30 01:24:37.904855 - 9:49:18 - step: 39790 acc: 0 loss: 1.5031 grad: 1.61e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5984 data: 0.0916 lr: 1.52e-05 mem: 47% pow: 653.247 W 0: INFO 26-04-30 01:24:51.952687 - 9:49:32 - step: 39800 acc: 0 loss: 1.2688 grad: 1.48e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.5948 data: 0.0861 lr: 1.52e-05 mem: 47% pow: 662.443 W 0: INFO 26-04-30 01:25:08.539909 - 9:49:49 - step: 39810 acc: 0 loss: 1.5961 grad: 1.60e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.595 data: 0.0789 lr: 1.52e-05 mem: 54% pow: 666.004 W 0: INFO 26-04-30 01:25:22.071796 - 9:50:02 - step: 39820 acc: 0 loss: 1.2546 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6172 data: 0.0884 lr: 1.51e-05 mem: 47% pow: 647.055 W 0: INFO 26-04-30 01:25:35.821244 - 9:50:16 - step: 39830 acc: 0 loss: 1.16 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5946 data: 0.0922 lr: 1.51e-05 mem: 47% pow: 658.067 W 0: INFO 26-04-30 01:25:49.589795 - 9:50:30 - step: 39840 acc: 0 loss: 1.2724 grad: 1.54e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6152 data: 0.0826 lr: 1.51e-05 mem: 47% pow: 647.088 W 0: INFO 26-04-30 01:26:03.268839 - 9:50:44 - step: 39850 acc: 0 loss: 1.207 grad: 1.66e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5871 data: 0.09 lr: 1.51e-05 mem: 47% pow: 664.383 W 0: INFO 26-04-30 01:26:17.139270 - 9:50:57 - step: 39860 acc: 0 loss: 1.0639 grad: 1.60e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5809 data: 0.0942 lr: 1.51e-05 mem: 47% pow: 664.983 W 0: INFO 26-04-30 01:26:31.055864 - 9:51:11 - step: 39870 acc: 0 loss: 0.9424 grad: 1.58e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.625 data: 0.0911 lr: 1.51e-05 mem: 47% pow: 638.733 W 0: INFO 26-04-30 01:26:45.031954 - 9:51:25 - step: 39880 acc: 0 loss: 1.2945 grad: 1.53e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5952 data: 0.0851 lr: 1.51e-05 mem: 47% pow: 660.266 W 0: INFO 26-04-30 01:26:58.557642 - 9:51:39 - step: 39890 acc: 0 loss: 1.2125 grad: 1.48e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6025 data: 0.0885 lr: 1.50e-05 mem: 47% pow: 655.702 W 0: INFO 26-04-30 01:27:12.178518 - 9:51:52 - step: 39900 acc: 0 loss: 1.5647 grad: 1.53e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5953 data: 0.089 lr: 1.50e-05 mem: 47% pow: 662.662 W 0: INFO 26-04-30 01:27:28.878249 - 9:52:09 - step: 39910 acc: 0 loss: 0.8147 grad: 1.57e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.5985 data: 0.0912 lr: 1.50e-05 mem: 54% pow: 666.212 W 0: INFO 26-04-30 01:27:42.434222 - 9:52:23 - step: 39920 acc: 0 loss: 1.0025 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5919 data: 0.0934 lr: 1.50e-05 mem: 47% pow: 657.132 W 0: INFO 26-04-30 01:27:56.186230 - 9:52:36 - step: 39930 acc: 0 loss: 1.3231 grad: 1.56e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5937 data: 0.0778 lr: 1.50e-05 mem: 47% pow: 666.725 W 0: INFO 26-04-30 01:28:09.917671 - 9:52:50 - step: 39940 acc: 0 loss: 1.3138 grad: 1.50e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.578 data: 0.1267 lr: 1.50e-05 mem: 47% pow: 643.437 W 0: INFO 26-04-30 01:28:23.629660 - 9:53:04 - step: 39950 acc: 0 loss: 0.9815 grad: 1.63e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5907 data: 0.0857 lr: 1.50e-05 mem: 47% pow: 657.908 W 0: INFO 26-04-30 01:28:37.263333 - 9:53:18 - step: 39960 acc: 0 loss: 1.1591 grad: 1.52e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5786 data: 0.0906 lr: 1.49e-05 mem: 47% pow: 674.999 W 0: INFO 26-04-30 01:28:50.924333 - 9:53:31 - step: 39970 acc: 0 loss: 1.057 grad: 1.61e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6002 data: 0.0842 lr: 1.49e-05 mem: 47% pow: 666.54 W 0: INFO 26-04-30 01:29:04.618116 - 9:53:45 - step: 39980 acc: 0 loss: 1.5646 grad: 1.57e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5813 data: 0.0911 lr: 1.49e-05 mem: 47% pow: 664.037 W 0: INFO 26-04-30 01:29:18.301952 - 9:53:59 - step: 39990 acc: 0 loss: 1.2001 grad: 1.71e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6308 data: 0.0973 lr: 1.49e-05 mem: 47% pow: 638.028 W 0: INFO 26-04-30 01:29:31.931371 - 9:54:12 - step: 40000 acc: 0 loss: 1.063 grad: 1.76e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6118 data: 0.0924 lr: 1.49e-05 mem: 47% pow: 649.577 W 0: INFO 26-04-30 01:29:31.934382 - 9:54:12 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000040000 0: INFO 26-04-30 01:29:31.934965 - 9:54:12 - Saving... 0: INFO 26-04-30 01:29:37.900658 - 9:54:18 - State dict saved! 0: INFO 26-04-30 01:29:37.990409 - 9:54:18 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000040000/train_state_00000.json 0: INFO 26-04-30 01:29:37.994477 - 9:54:18 - Train state saved ! 0: INFO 26-04-30 01:29:37.994683 - 9:54:18 - Cleaning up checkpoints... 0: INFO 26-04-30 01:29:37.994842 - 9:54:18 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000035000'), PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000040000')] 0: INFO 26-04-30 01:29:37.995020 - 9:54:18 - Eval folders: [] 0: INFO 26-04-30 01:29:37.995140 - 9:54:18 - Other folders: [] 0: INFO 26-04-30 01:29:37.995275 - 9:54:18 - Removing folders: {PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000035000')} 0: INFO 26-04-30 01:29:42.100536 - 9:54:22 - garbage collection 0: INFO 26-04-30 01:29:56.577467 - 9:54:37 - step: 40010 acc: 0 loss: 1.3088 grad: 1.51e-01 flops: 2.29e+14 wps: 2.66e+04 iter: 0.6775 data: 0.0696 lr: 1.49e-05 mem: 54% pow: 629.299 W 0: INFO 26-04-30 01:30:10.139959 - 9:54:50 - step: 40020 acc: 0 loss: 1.193 grad: 1.52e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5887 data: 0.0854 lr: 1.49e-05 mem: 47% pow: 661.569 W 0: INFO 26-04-30 01:30:24.080528 - 9:55:04 - step: 40030 acc: 0 loss: 1.2794 grad: 1.50e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7776 data: 0.0945 lr: 1.48e-05 mem: 47% pow: 552.38 W 0: INFO 26-04-30 01:30:37.612395 - 9:55:18 - step: 40040 acc: 0 loss: 1.073 grad: 1.62e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5966 data: 0.0893 lr: 1.48e-05 mem: 47% pow: 659.32 W 0: INFO 26-04-30 01:30:51.155592 - 9:55:31 - step: 40050 acc: 0 loss: 1.2713 grad: 1.79e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6054 data: 0.0949 lr: 1.48e-05 mem: 47% pow: 645.578 W 0: INFO 26-04-30 01:31:04.913659 - 9:55:45 - step: 40060 acc: 0 loss: 1.3479 grad: 1.57e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.6358 data: 0.0837 lr: 1.48e-05 mem: 47% pow: 658.496 W 0: INFO 26-04-30 01:31:18.524629 - 9:55:59 - step: 40070 acc: 0 loss: 1.1991 grad: 1.59e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6306 data: 0.0873 lr: 1.48e-05 mem: 47% pow: 627.432 W 0: INFO 26-04-30 01:31:32.109789 - 9:56:12 - step: 40080 acc: 0 loss: 1.3393 grad: 1.47e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5991 data: 0.0834 lr: 1.48e-05 mem: 47% pow: 658.329 W 0: INFO 26-04-30 01:31:45.775685 - 9:56:26 - step: 40090 acc: 0 loss: 1.1999 grad: 1.52e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5907 data: 0.0913 lr: 1.47e-05 mem: 47% pow: 658.752 W 0: INFO 26-04-30 01:31:59.538559 - 9:56:40 - step: 40100 acc: 0 loss: 1.2852 grad: 1.50e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6513 data: 0.0896 lr: 1.47e-05 mem: 47% pow: 617.185 W 0: INFO 26-04-30 01:32:16.321414 - 9:56:57 - step: 40110 acc: 0 loss: 1.3508 grad: 1.58e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6326 data: 0.0806 lr: 1.47e-05 mem: 54% pow: 637.807 W 0: INFO 26-04-30 01:32:29.869879 - 9:57:10 - step: 40120 acc: 0 loss: 1.7894 grad: 1.70e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5838 data: 0.1062 lr: 1.47e-05 mem: 47% pow: 659.759 W 0: INFO 26-04-30 01:32:44.106082 - 9:57:24 - step: 40130 acc: 0 loss: 1.6161 grad: 1.53e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.5806 data: 0.1354 lr: 1.47e-05 mem: 47% pow: 651.889 W 0: INFO 26-04-30 01:32:57.871917 - 9:57:38 - step: 40140 acc: 0 loss: 1.297 grad: 1.56e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5921 data: 0.091 lr: 1.47e-05 mem: 47% pow: 662.33 W 0: INFO 26-04-30 01:33:11.837019 - 9:57:52 - step: 40150 acc: 0 loss: 1.3304 grad: 1.67e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.7319 data: 0.0928 lr: 1.47e-05 mem: 47% pow: 587.012 W 0: INFO 26-04-30 01:33:25.653165 - 9:58:06 - step: 40160 acc: 0 loss: 1.1983 grad: 1.55e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5946 data: 0.092 lr: 1.46e-05 mem: 47% pow: 661.527 W 0: INFO 26-04-30 01:33:39.105232 - 9:58:19 - step: 40170 acc: 0 loss: 1.4929 grad: 1.62e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5839 data: 0.0851 lr: 1.46e-05 mem: 47% pow: 671.826 W 0: INFO 26-04-30 01:33:53.083608 - 9:58:33 - step: 40180 acc: 0 loss: 1.3113 grad: 1.61e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5791 data: 0.0912 lr: 1.46e-05 mem: 47% pow: 661.055 W 0: INFO 26-04-30 01:34:06.662761 - 9:58:47 - step: 40190 acc: 0 loss: 1.2927 grad: 1.65e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5877 data: 0.0967 lr: 1.46e-05 mem: 47% pow: 654.041 W 0: INFO 26-04-30 01:34:20.325616 - 9:59:01 - step: 40200 acc: 0 loss: 1.6884 grad: 1.56e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5974 data: 0.0812 lr: 1.46e-05 mem: 47% pow: 659.784 W 0: INFO 26-04-30 01:34:37.013663 - 9:59:17 - step: 40210 acc: 0 loss: 1.4501 grad: 1.65e-01 flops: 3.38e+14 wps: 3.93e+04 iter: 0.6089 data: 0.0923 lr: 1.46e-05 mem: 54% pow: 649.098 W 0: INFO 26-04-30 01:34:51.156514 - 9:59:31 - step: 40220 acc: 0 loss: 1.4129 grad: 1.46e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.592 data: 0.0913 lr: 1.46e-05 mem: 47% pow: 670.339 W 0: INFO 26-04-30 01:35:04.805506 - 9:59:45 - step: 40230 acc: 0 loss: 1.4097 grad: 1.53e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6175 data: 0.0799 lr: 1.45e-05 mem: 47% pow: 654.299 W 0: INFO 26-04-30 01:35:18.552114 - 9:59:59 - step: 40240 acc: 0 loss: 1.4702 grad: 1.61e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.609 data: 0.0836 lr: 1.45e-05 mem: 47% pow: 649.958 W 0: INFO 26-04-30 01:35:32.157314 - 10:00:12 - step: 40250 acc: 0 loss: 1.2986 grad: 1.61e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6186 data: 0.0892 lr: 1.45e-05 mem: 47% pow: 647.099 W 0: INFO 26-04-30 01:35:45.729427 - 10:00:26 - step: 40260 acc: 0 loss: 1.5661 grad: 1.59e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6358 data: 0.0928 lr: 1.45e-05 mem: 47% pow: 644.846 W 0: INFO 26-04-30 01:35:59.281414 - 10:00:40 - step: 40270 acc: 0 loss: 1.3881 grad: 1.62e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5791 data: 0.1107 lr: 1.45e-05 mem: 47% pow: 651.236 W 0: INFO 26-04-30 01:36:12.927936 - 10:00:53 - step: 40280 acc: 0 loss: 1.4654 grad: 1.63e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6025 data: 0.0894 lr: 1.45e-05 mem: 47% pow: 667.871 W 0: INFO 26-04-30 01:36:26.615238 - 10:01:07 - step: 40290 acc: 0 loss: 1.5351 grad: 1.58e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.58 data: 0.1062 lr: 1.44e-05 mem: 47% pow: 670.788 W 0: INFO 26-04-30 01:36:40.381378 - 10:01:21 - step: 40300 acc: 0 loss: 1.3104 grad: 1.51e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.7318 data: 0.0784 lr: 1.44e-05 mem: 47% pow: 583.882 W 0: INFO 26-04-30 01:36:57.021081 - 10:01:37 - step: 40310 acc: 0 loss: 1.3243 grad: 1.49e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6103 data: 0.0637 lr: 1.44e-05 mem: 54% pow: 665.679 W 0: INFO 26-04-30 01:37:10.601150 - 10:01:51 - step: 40320 acc: 0 loss: 1.1656 grad: 1.45e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5974 data: 0.0953 lr: 1.44e-05 mem: 47% pow: 652.708 W 0: INFO 26-04-30 01:37:24.227337 - 10:02:05 - step: 40330 acc: 0 loss: 1.5697 grad: 1.61e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6101 data: 0.0859 lr: 1.44e-05 mem: 47% pow: 650.8 W 0: INFO 26-04-30 01:37:38.400779 - 10:02:19 - step: 40340 acc: 0 loss: 1.5846 grad: 1.56e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.8442 data: 0.0883 lr: 1.44e-05 mem: 47% pow: 527.199 W 0: INFO 26-04-30 01:37:51.986464 - 10:02:32 - step: 40350 acc: 0 loss: 1.0613 grad: 1.64e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6125 data: 0.0903 lr: 1.44e-05 mem: 47% pow: 646.548 W 0: INFO 26-04-30 01:38:05.650494 - 10:02:46 - step: 40360 acc: 0 loss: 1.1337 grad: 1.55e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6188 data: 0.0952 lr: 1.43e-05 mem: 47% pow: 637.236 W 0: INFO 26-04-30 01:38:19.256104 - 10:03:00 - step: 40370 acc: 0 loss: 1.02 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6127 data: 0.0837 lr: 1.43e-05 mem: 47% pow: 666.063 W 0: INFO 26-04-30 01:38:32.659675 - 10:03:13 - step: 40380 acc: 0 loss: 1.244 grad: 1.55e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.601 data: 0.087 lr: 1.43e-05 mem: 47% pow: 654.565 W 0: INFO 26-04-30 01:38:46.250529 - 10:03:27 - step: 40390 acc: 0 loss: 1.4979 grad: 1.59e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6086 data: 0.0877 lr: 1.43e-05 mem: 47% pow: 643.476 W 0: INFO 26-04-30 01:39:00.014142 - 10:03:40 - step: 40400 acc: 0 loss: 1.2282 grad: 1.69e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6243 data: 0.0774 lr: 1.43e-05 mem: 47% pow: 669.207 W 0: INFO 26-04-30 01:39:16.518312 - 10:03:57 - step: 40410 acc: 0 loss: 1.4154 grad: 1.69e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6185 data: 0.0865 lr: 1.43e-05 mem: 54% pow: 646.21 W 0: INFO 26-04-30 01:39:30.042284 - 10:04:10 - step: 40420 acc: 0 loss: 1.2244 grad: 1.55e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5817 data: 0.087 lr: 1.43e-05 mem: 47% pow: 664.469 W 0: INFO 26-04-30 01:39:43.955768 - 10:04:24 - step: 40430 acc: 0 loss: 1.1182 grad: 1.53e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6453 data: 0.0821 lr: 1.42e-05 mem: 47% pow: 645.396 W 0: INFO 26-04-30 01:39:57.708803 - 10:04:38 - step: 40440 acc: 0 loss: 1.4269 grad: 1.81e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6102 data: 0.0802 lr: 1.42e-05 mem: 47% pow: 652.829 W 0: INFO 26-04-30 01:40:11.783350 - 10:04:52 - step: 40450 acc: 0 loss: 1.3979 grad: 1.70e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.5809 data: 0.0934 lr: 1.42e-05 mem: 47% pow: 666.491 W 0: INFO 26-04-30 01:40:25.271514 - 10:05:06 - step: 40460 acc: 0 loss: 1.2305 grad: 1.54e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.595 data: 0.0836 lr: 1.42e-05 mem: 47% pow: 660.286 W 0: INFO 26-04-30 01:40:39.004165 - 10:05:19 - step: 40470 acc: 0 loss: 1.6579 grad: 1.90e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5872 data: 0.0888 lr: 1.42e-05 mem: 47% pow: 664.846 W 0: INFO 26-04-30 01:40:52.501421 - 10:05:33 - step: 40480 acc: 0 loss: 1.5404 grad: 1.62e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5801 data: 0.0879 lr: 1.42e-05 mem: 47% pow: 670.628 W 0: INFO 26-04-30 01:41:06.131479 - 10:05:46 - step: 40490 acc: 0 loss: 1.1367 grad: 1.63e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5858 data: 0.0863 lr: 1.42e-05 mem: 47% pow: 673.564 W 0: INFO 26-04-30 01:41:19.765716 - 10:06:00 - step: 40500 acc: 0 loss: 1.2763 grad: 1.77e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6583 data: 0.0734 lr: 1.41e-05 mem: 47% pow: 634.138 W 0: INFO 26-04-30 01:41:36.332455 - 10:06:17 - step: 40510 acc: 0 loss: 1.5168 grad: 1.61e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.5879 data: 0.0897 lr: 1.41e-05 mem: 54% pow: 654.927 W 0: INFO 26-04-30 01:41:50.028559 - 10:06:30 - step: 40520 acc: 0 loss: 0.9576 grad: 1.61e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6027 data: 0.0841 lr: 1.41e-05 mem: 47% pow: 676.583 W 0: INFO 26-04-30 01:42:03.616256 - 10:06:44 - step: 40530 acc: 0 loss: 1.2382 grad: 1.55e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6155 data: 0.0868 lr: 1.41e-05 mem: 47% pow: 652.421 W 0: INFO 26-04-30 01:42:17.262089 - 10:06:58 - step: 40540 acc: 0 loss: 1.3063 grad: 1.61e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6017 data: 0.0922 lr: 1.41e-05 mem: 47% pow: 656.073 W 0: INFO 26-04-30 01:42:31.045162 - 10:07:11 - step: 40550 acc: 0 loss: 1.4148 grad: 1.63e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5806 data: 0.1132 lr: 1.41e-05 mem: 47% pow: 666.741 W 0: INFO 26-04-30 01:42:44.743733 - 10:07:25 - step: 40560 acc: 0 loss: 1.2431 grad: 1.51e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.592 data: 0.0832 lr: 1.40e-05 mem: 47% pow: 662.811 W 0: INFO 26-04-30 01:42:58.300537 - 10:07:39 - step: 40570 acc: 0 loss: 1.2119 grad: 1.85e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6037 data: 0.1044 lr: 1.40e-05 mem: 47% pow: 658.55 W 0: INFO 26-04-30 01:43:12.172824 - 10:07:52 - step: 40580 acc: 0 loss: 1.2041 grad: 1.60e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5986 data: 0.0953 lr: 1.40e-05 mem: 47% pow: 665.266 W 0: INFO 26-04-30 01:43:25.957615 - 10:08:06 - step: 40590 acc: 0 loss: 1.3308 grad: 1.50e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6313 data: 0.0735 lr: 1.40e-05 mem: 47% pow: 644.13 W 0: INFO 26-04-30 01:43:39.675060 - 10:08:20 - step: 40600 acc: 0 loss: 1.265 grad: 1.59e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5922 data: 0.0885 lr: 1.40e-05 mem: 47% pow: 658.17 W 0: INFO 26-04-30 01:43:56.269313 - 10:08:37 - step: 40610 acc: 0 loss: 1.3072 grad: 1.65e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.5906 data: 0.0893 lr: 1.40e-05 mem: 54% pow: 654.808 W 0: INFO 26-04-30 01:44:09.977475 - 10:08:50 - step: 40620 acc: 0 loss: 1.3072 grad: 1.51e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5911 data: 0.0887 lr: 1.40e-05 mem: 47% pow: 670.144 W 0: INFO 26-04-30 01:44:23.805367 - 10:09:04 - step: 40630 acc: 0 loss: 1.4904 grad: 1.54e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6241 data: 0.0924 lr: 1.39e-05 mem: 47% pow: 637.579 W 0: INFO 26-04-30 01:44:38.274409 - 10:09:19 - step: 40640 acc: 0 loss: 1.4751 grad: 1.53e-01 flops: 3.91e+14 wps: 4.53e+04 iter: 0.5843 data: 0.1139 lr: 1.39e-05 mem: 47% pow: 641.779 W 0: INFO 26-04-30 01:44:51.875575 - 10:09:32 - step: 40650 acc: 0 loss: 1.6586 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.602 data: 0.0839 lr: 1.39e-05 mem: 47% pow: 665.965 W 0: INFO 26-04-30 01:45:05.595681 - 10:09:46 - step: 40660 acc: 0 loss: 1.4899 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7459 data: 0.0781 lr: 1.39e-05 mem: 47% pow: 582.6 W 0: INFO 26-04-30 01:45:19.258424 - 10:10:00 - step: 40670 acc: 0 loss: 1.3638 grad: 1.56e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5781 data: 0.1003 lr: 1.39e-05 mem: 47% pow: 660.493 W 0: INFO 26-04-30 01:45:32.853363 - 10:10:13 - step: 40680 acc: 0 loss: 0.96 grad: 1.53e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5887 data: 0.0887 lr: 1.39e-05 mem: 47% pow: 660.769 W 0: INFO 26-04-30 01:45:46.530300 - 10:10:27 - step: 40690 acc: 0 loss: 1.1765 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6241 data: 0.0712 lr: 1.39e-05 mem: 47% pow: 648.574 W 0: INFO 26-04-30 01:46:00.357197 - 10:10:41 - step: 40700 acc: 0 loss: 1.6317 grad: 1.64e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6223 data: 0.0841 lr: 1.38e-05 mem: 47% pow: 642.223 W 0: INFO 26-04-30 01:46:16.961421 - 10:10:57 - step: 40710 acc: 0 loss: 1.7268 grad: 1.53e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6068 data: 0.0879 lr: 1.38e-05 mem: 54% pow: 651.918 W 0: INFO 26-04-30 01:46:30.674258 - 10:11:11 - step: 40720 acc: 0 loss: 1.6015 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5938 data: 0.0903 lr: 1.38e-05 mem: 47% pow: 663.008 W 0: INFO 26-04-30 01:46:44.405668 - 10:11:25 - step: 40730 acc: 0 loss: 1.2095 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6394 data: 0.0866 lr: 1.38e-05 mem: 47% pow: 637.49 W 0: INFO 26-04-30 01:46:58.026460 - 10:11:38 - step: 40740 acc: 0 loss: 1.2475 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6407 data: 0.0897 lr: 1.38e-05 mem: 47% pow: 632.432 W 0: INFO 26-04-30 01:47:11.640764 - 10:11:52 - step: 40750 acc: 0 loss: 1.3212 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5825 data: 0.1023 lr: 1.38e-05 mem: 47% pow: 660.69 W 0: INFO 26-04-30 01:47:25.358864 - 10:12:06 - step: 40760 acc: 0 loss: 1.1839 grad: 1.54e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.589 data: 0.08 lr: 1.38e-05 mem: 47% pow: 674.098 W 0: INFO 26-04-30 01:47:39.049863 - 10:12:19 - step: 40770 acc: 0 loss: 1.5064 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6071 data: 0.0881 lr: 1.37e-05 mem: 47% pow: 648.012 W 0: INFO 26-04-30 01:47:52.681961 - 10:12:33 - step: 40780 acc: 0 loss: 1.4277 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6716 data: 0.0946 lr: 1.37e-05 mem: 47% pow: 614.967 W 0: INFO 26-04-30 01:48:06.484685 - 10:12:47 - step: 40790 acc: 0 loss: 1.2838 grad: 1.64e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6783 data: 0.0966 lr: 1.37e-05 mem: 47% pow: 607.739 W 0: INFO 26-04-30 01:48:20.186205 - 10:13:00 - step: 40800 acc: 0 loss: 1.2418 grad: 1.51e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6017 data: 0.0873 lr: 1.37e-05 mem: 47% pow: 670.582 W 0: INFO 26-04-30 01:48:36.836061 - 10:13:17 - step: 40810 acc: 0 loss: 1.5273 grad: 1.64e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.5876 data: 0.0913 lr: 1.37e-05 mem: 54% pow: 663.62 W 0: INFO 26-04-30 01:48:50.438417 - 10:13:31 - step: 40820 acc: 0 loss: 1.6115 grad: 1.60e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5973 data: 0.0891 lr: 1.37e-05 mem: 47% pow: 662.403 W 0: INFO 26-04-30 01:49:04.164559 - 10:13:44 - step: 40830 acc: 0 loss: 1.7877 grad: 1.61e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6077 data: 0.0848 lr: 1.36e-05 mem: 47% pow: 653.745 W 0: INFO 26-04-30 01:49:17.908430 - 10:13:58 - step: 40840 acc: 0 loss: 1.1848 grad: 1.54e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.585 data: 0.0872 lr: 1.36e-05 mem: 47% pow: 670.072 W 0: INFO 26-04-30 01:49:31.685522 - 10:14:12 - step: 40850 acc: 0 loss: 1.3963 grad: 1.49e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.592 data: 0.0814 lr: 1.36e-05 mem: 47% pow: 664.476 W 0: INFO 26-04-30 01:49:45.129011 - 10:14:25 - step: 40860 acc: 0 loss: 1.0871 grad: 1.55e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6018 data: 0.0858 lr: 1.36e-05 mem: 47% pow: 664.322 W 0: INFO 26-04-30 01:49:58.945330 - 10:14:39 - step: 40870 acc: 0 loss: 1.4798 grad: 1.59e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6018 data: 0.0846 lr: 1.36e-05 mem: 47% pow: 654.432 W 0: INFO 26-04-30 01:50:12.733844 - 10:14:53 - step: 40880 acc: 0 loss: 1.3418 grad: 1.51e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6011 data: 0.0743 lr: 1.36e-05 mem: 47% pow: 660.711 W 0: INFO 26-04-30 01:50:26.341462 - 10:15:07 - step: 40890 acc: 0 loss: 1.2315 grad: 1.57e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5905 data: 0.0929 lr: 1.36e-05 mem: 47% pow: 659.549 W 0: INFO 26-04-30 01:50:39.880235 - 10:15:20 - step: 40900 acc: 0 loss: 1.15 grad: 1.56e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6232 data: 0.087 lr: 1.35e-05 mem: 47% pow: 646.452 W 0: INFO 26-04-30 01:50:56.545973 - 10:15:37 - step: 40910 acc: 0 loss: 1.5085 grad: 1.52e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5999 data: 0.089 lr: 1.35e-05 mem: 54% pow: 661.918 W 0: INFO 26-04-30 01:51:10.244996 - 10:15:51 - step: 40920 acc: 0 loss: 1.0519 grad: 1.59e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6175 data: 0.0935 lr: 1.35e-05 mem: 47% pow: 640.174 W 0: INFO 26-04-30 01:51:24.022189 - 10:16:04 - step: 40930 acc: 0 loss: 1.2667 grad: 1.55e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5998 data: 0.0854 lr: 1.35e-05 mem: 47% pow: 662.075 W 0: INFO 26-04-30 01:51:37.440103 - 10:16:18 - step: 40940 acc: 0 loss: 1.2007 grad: 1.56e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5994 data: 0.0886 lr: 1.35e-05 mem: 47% pow: 671.082 W 0: INFO 26-04-30 01:51:51.035735 - 10:16:31 - step: 40950 acc: 0 loss: 1.4044 grad: 1.53e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6404 data: 0.0791 lr: 1.35e-05 mem: 47% pow: 634.967 W 0: INFO 26-04-30 01:52:04.886081 - 10:16:45 - step: 40960 acc: 0 loss: 1.4339 grad: 1.54e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6482 data: 0.0784 lr: 1.35e-05 mem: 47% pow: 639.188 W 0: INFO 26-04-30 01:52:18.622578 - 10:16:59 - step: 40970 acc: 0 loss: 1.3597 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5984 data: 0.0916 lr: 1.34e-05 mem: 47% pow: 653.857 W 0: INFO 26-04-30 01:52:32.366440 - 10:17:13 - step: 40980 acc: 0 loss: 1.4364 grad: 1.52e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6068 data: 0.0815 lr: 1.34e-05 mem: 47% pow: 661.912 W 0: INFO 26-04-30 01:52:46.100934 - 10:17:26 - step: 40990 acc: 0 loss: 1.5405 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6584 data: 0.0868 lr: 1.34e-05 mem: 47% pow: 627.792 W 0: INFO 26-04-30 01:52:59.605956 - 10:17:40 - step: 41000 acc: 0 loss: 1.3274 grad: 1.58e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5913 data: 0.0927 lr: 1.34e-05 mem: 47% pow: 665.267 W 0: INFO 26-04-30 01:53:03.319444 - 10:17:44 - garbage collection 0: INFO 26-04-30 01:53:17.617075 - 10:17:58 - step: 41010 acc: 0 loss: 1.4729 grad: 1.50e-01 flops: 3.14e+14 wps: 3.64e+04 iter: 0.5976 data: 0.0869 lr: 1.34e-05 mem: 54% pow: 662.04 W 0: INFO 26-04-30 01:53:31.242217 - 10:18:12 - step: 41020 acc: 0 loss: 1.568 grad: 1.54e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5891 data: 0.0887 lr: 1.34e-05 mem: 47% pow: 663.457 W 0: INFO 26-04-30 01:53:44.878574 - 10:18:25 - step: 41030 acc: 0 loss: 1.3751 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6198 data: 0.1061 lr: 1.33e-05 mem: 47% pow: 638.167 W 0: INFO 26-04-30 01:53:58.417295 - 10:18:39 - step: 41040 acc: 0 loss: 1.3215 grad: 1.54e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6156 data: 0.0864 lr: 1.33e-05 mem: 47% pow: 656.945 W 0: INFO 26-04-30 01:54:12.273770 - 10:18:53 - step: 41050 acc: 0 loss: 1.2629 grad: 1.54e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.8691 data: 0.0682 lr: 1.33e-05 mem: 47% pow: 513.379 W 0: INFO 26-04-30 01:54:26.070724 - 10:19:06 - step: 41060 acc: 0 loss: 1.1071 grad: 1.48e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5994 data: 0.0783 lr: 1.33e-05 mem: 47% pow: 663.112 W 0: INFO 26-04-30 01:54:39.699020 - 10:19:20 - step: 41070 acc: 0 loss: 1.0115 grad: 1.56e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6046 data: 0.0847 lr: 1.33e-05 mem: 47% pow: 680.162 W 0: INFO 26-04-30 01:54:53.424792 - 10:19:34 - step: 41080 acc: 0 loss: 1.4464 grad: 1.66e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.5873 data: 0.0854 lr: 1.33e-05 mem: 47% pow: 672.355 W 0: INFO 26-04-30 01:55:07.041194 - 10:19:47 - step: 41090 acc: 0 loss: 1.0608 grad: 1.56e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5895 data: 0.0879 lr: 1.33e-05 mem: 47% pow: 658.231 W 0: INFO 26-04-30 01:55:20.840261 - 10:20:01 - step: 41100 acc: 0 loss: 1.7103 grad: 1.56e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6018 data: 0.0859 lr: 1.32e-05 mem: 47% pow: 659.952 W 0: INFO 26-04-30 01:55:37.549499 - 10:20:18 - step: 41110 acc: 0 loss: 1.42 grad: 1.63e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.7191 data: 0.0877 lr: 1.32e-05 mem: 54% pow: 594.603 W 0: INFO 26-04-30 01:55:51.370024 - 10:20:32 - step: 41120 acc: 0 loss: 1.1399 grad: 1.63e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.647 data: 0.0899 lr: 1.32e-05 mem: 47% pow: 623.655 W 0: INFO 26-04-30 01:56:05.222586 - 10:20:46 - step: 41130 acc: 0 loss: 1.678 grad: 1.57e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6247 data: 0.0618 lr: 1.32e-05 mem: 47% pow: 658.633 W 0: INFO 26-04-30 01:56:18.828218 - 10:20:59 - step: 41140 acc: 0 loss: 1.6768 grad: 1.54e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5892 data: 0.0991 lr: 1.32e-05 mem: 47% pow: 678.582 W 0: INFO 26-04-30 01:56:32.482393 - 10:21:13 - step: 41150 acc: 0 loss: 1.2166 grad: 1.51e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.616 data: 0.0906 lr: 1.32e-05 mem: 47% pow: 646.987 W 0: INFO 26-04-30 01:56:45.968611 - 10:21:26 - step: 41160 acc: 0 loss: 1.3013 grad: 1.59e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6294 data: 0.0805 lr: 1.32e-05 mem: 47% pow: 640.996 W 0: INFO 26-04-30 01:56:59.530431 - 10:21:40 - step: 41170 acc: 0 loss: 1.4329 grad: 1.58e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5802 data: 0.0976 lr: 1.31e-05 mem: 47% pow: 662.106 W 0: INFO 26-04-30 01:57:13.249848 - 10:21:54 - step: 41180 acc: 0 loss: 1.1964 grad: 1.59e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5916 data: 0.0902 lr: 1.31e-05 mem: 47% pow: 684.819 W 0: INFO 26-04-30 01:57:27.003738 - 10:22:07 - step: 41190 acc: 0 loss: 1.3501 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6308 data: 0.0599 lr: 1.31e-05 mem: 47% pow: 655.4 W 0: INFO 26-04-30 01:57:41.449629 - 10:22:22 - step: 41200 acc: 0 loss: 1.2658 grad: 1.52e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.5848 data: 0.0907 lr: 1.31e-05 mem: 47% pow: 666.243 W 0: INFO 26-04-30 01:57:57.880037 - 10:22:38 - step: 41210 acc: 0 loss: 1.3222 grad: 1.57e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.583 data: 0.1027 lr: 1.31e-05 mem: 54% pow: 663.339 W 0: INFO 26-04-30 01:58:11.412206 - 10:22:52 - step: 41220 acc: 0 loss: 1.2875 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.589 data: 0.1006 lr: 1.31e-05 mem: 47% pow: 660.616 W 0: INFO 26-04-30 01:58:25.045925 - 10:23:05 - step: 41230 acc: 0 loss: 1.2715 grad: 1.53e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6141 data: 0.0716 lr: 1.31e-05 mem: 47% pow: 661.437 W 0: INFO 26-04-30 01:58:38.570312 - 10:23:19 - step: 41240 acc: 0 loss: 1.5948 grad: 1.63e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6075 data: 0.0895 lr: 1.30e-05 mem: 47% pow: 651.383 W 0: INFO 26-04-30 01:58:52.071689 - 10:23:32 - step: 41250 acc: 0 loss: 1.1345 grad: 1.55e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5889 data: 0.0963 lr: 1.30e-05 mem: 47% pow: 671.885 W 0: INFO 26-04-30 01:59:05.523302 - 10:23:46 - step: 41260 acc: 0 loss: 1.2797 grad: 1.52e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5972 data: 0.093 lr: 1.30e-05 mem: 47% pow: 657.503 W 0: INFO 26-04-30 01:59:18.940820 - 10:23:59 - step: 41270 acc: 0 loss: 1.2302 grad: 1.49e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6063 data: 0.0793 lr: 1.30e-05 mem: 47% pow: 666.227 W 0: INFO 26-04-30 01:59:32.627432 - 10:24:13 - step: 41280 acc: 0 loss: 1.3884 grad: 1.65e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6099 data: 0.0866 lr: 1.30e-05 mem: 47% pow: 654.376 W 0: INFO 26-04-30 01:59:46.112337 - 10:24:26 - step: 41290 acc: 0 loss: 1.3097 grad: 1.62e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5803 data: 0.0898 lr: 1.30e-05 mem: 47% pow: 671.349 W 0: INFO 26-04-30 01:59:59.695661 - 10:24:40 - step: 41300 acc: 0 loss: 1.3245 grad: 1.59e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6008 data: 0.082 lr: 1.29e-05 mem: 47% pow: 659.911 W 0: INFO 26-04-30 02:00:16.301630 - 10:24:57 - step: 41310 acc: 0 loss: 1.678 grad: 1.53e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6331 data: 0.0917 lr: 1.29e-05 mem: 54% pow: 633.15 W 0: INFO 26-04-30 02:00:29.847842 - 10:25:10 - step: 41320 acc: 0 loss: 1.3225 grad: 1.57e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5994 data: 0.0915 lr: 1.29e-05 mem: 47% pow: 651.845 W 0: INFO 26-04-30 02:00:43.354681 - 10:25:24 - step: 41330 acc: 0 loss: 1.3132 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5982 data: 0.0844 lr: 1.29e-05 mem: 47% pow: 659.534 W 0: INFO 26-04-30 02:00:56.774613 - 10:25:37 - step: 41340 acc: 0 loss: 1.1829 grad: 1.47e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.5806 data: 0.0938 lr: 1.29e-05 mem: 47% pow: 663.609 W 0: INFO 26-04-30 02:01:10.590590 - 10:25:51 - step: 41350 acc: 0 loss: 1.3389 grad: 1.63e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5936 data: 0.0849 lr: 1.29e-05 mem: 47% pow: 660.271 W 0: INFO 26-04-30 02:01:24.358494 - 10:26:05 - step: 41360 acc: 0 loss: 1.3143 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5982 data: 0.0904 lr: 1.29e-05 mem: 47% pow: 647.928 W 0: INFO 26-04-30 02:01:37.859010 - 10:26:18 - step: 41370 acc: 0 loss: 1.3341 grad: 1.54e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5982 data: 0.0883 lr: 1.28e-05 mem: 47% pow: 667.599 W 0: INFO 26-04-30 02:01:51.611902 - 10:26:32 - step: 41380 acc: 0 loss: 1.3629 grad: 1.59e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6012 data: 0.0908 lr: 1.28e-05 mem: 47% pow: 655.428 W 0: INFO 26-04-30 02:02:05.227148 - 10:26:46 - step: 41390 acc: 0 loss: 1.834 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6458 data: 0.0817 lr: 1.28e-05 mem: 47% pow: 642.979 W 0: INFO 26-04-30 02:02:18.701865 - 10:26:59 - step: 41400 acc: 0 loss: 1.3045 grad: 1.58e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6095 data: 0.0696 lr: 1.28e-05 mem: 47% pow: 689.412 W 0: INFO 26-04-30 02:02:35.102330 - 10:27:15 - step: 41410 acc: 0 loss: 1.1494 grad: 1.58e-01 flops: 3.44e+14 wps: 4.00e+04 iter: 0.585 data: 0.1013 lr: 1.28e-05 mem: 54% pow: 655.765 W 0: INFO 26-04-30 02:02:48.509325 - 10:27:29 - step: 41420 acc: 0 loss: 1.2726 grad: 1.55e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6106 data: 0.0862 lr: 1.28e-05 mem: 47% pow: 649.887 W 0: INFO 26-04-30 02:03:02.118195 - 10:27:42 - step: 41430 acc: 0 loss: 1.181 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5826 data: 0.0944 lr: 1.28e-05 mem: 47% pow: 666.177 W 0: INFO 26-04-30 02:03:15.689434 - 10:27:56 - step: 41440 acc: 0 loss: 1.3629 grad: 1.65e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5848 data: 0.0911 lr: 1.27e-05 mem: 47% pow: 663.167 W 0: INFO 26-04-30 02:03:29.392524 - 10:28:10 - step: 41450 acc: 0 loss: 1.2365 grad: 1.57e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5916 data: 0.0883 lr: 1.27e-05 mem: 47% pow: 653.887 W 0: INFO 26-04-30 02:03:42.926210 - 10:28:23 - step: 41460 acc: 0 loss: 1.3914 grad: 1.58e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.6135 data: 0.0937 lr: 1.27e-05 mem: 47% pow: 646.426 W 0: INFO 26-04-30 02:03:56.654022 - 10:28:37 - step: 41470 acc: 0 loss: 1.3419 grad: 1.51e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.6156 data: 0.0832 lr: 1.27e-05 mem: 47% pow: 656.376 W 0: INFO 26-04-30 02:04:10.477150 - 10:28:51 - step: 41480 acc: 0 loss: 1.2383 grad: 1.57e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5919 data: 0.0885 lr: 1.27e-05 mem: 47% pow: 659.884 W 0: INFO 26-04-30 02:04:24.076366 - 10:29:04 - step: 41490 acc: 0 loss: 1.3322 grad: 1.51e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5892 data: 0.091 lr: 1.27e-05 mem: 47% pow: 661.167 W 0: INFO 26-04-30 02:04:37.639296 - 10:29:18 - step: 41500 acc: 0 loss: 1.4396 grad: 1.73e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5834 data: 0.0947 lr: 1.26e-05 mem: 47% pow: 661.105 W 0: INFO 26-04-30 02:04:54.310387 - 10:29:35 - step: 41510 acc: 0 loss: 1.4018 grad: 1.61e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6092 data: 0.0693 lr: 1.26e-05 mem: 54% pow: 656.793 W 0: INFO 26-04-30 02:05:08.044016 - 10:29:48 - step: 41520 acc: 0 loss: 1.1804 grad: 1.58e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.5936 data: 0.0892 lr: 1.26e-05 mem: 47% pow: 663.56 W 0: INFO 26-04-30 02:05:21.543088 - 10:30:02 - step: 41530 acc: 0 loss: 1.3758 grad: 1.55e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6038 data: 0.1033 lr: 1.26e-05 mem: 47% pow: 644.435 W 0: INFO 26-04-30 02:05:34.929759 - 10:30:15 - step: 41540 acc: 0 loss: 1.2556 grad: 1.67e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5989 data: 0.0893 lr: 1.26e-05 mem: 47% pow: 663.162 W 0: INFO 26-04-30 02:05:48.410117 - 10:30:29 - step: 41550 acc: 0 loss: 1.4925 grad: 1.63e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6106 data: 0.0838 lr: 1.26e-05 mem: 47% pow: 654.334 W 0: INFO 26-04-30 02:06:01.857994 - 10:30:42 - step: 41560 acc: 0 loss: 1.3096 grad: 1.52e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5913 data: 0.0886 lr: 1.26e-05 mem: 47% pow: 659.64 W 0: INFO 26-04-30 02:06:15.527731 - 10:30:56 - step: 41570 acc: 0 loss: 1.4344 grad: 1.54e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6064 data: 0.0888 lr: 1.25e-05 mem: 47% pow: 654.949 W 0: INFO 26-04-30 02:06:29.151092 - 10:31:09 - step: 41580 acc: 0 loss: 1.4381 grad: 1.58e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5879 data: 0.0872 lr: 1.25e-05 mem: 47% pow: 657.14 W 0: INFO 26-04-30 02:06:42.840729 - 10:31:23 - step: 41590 acc: 0 loss: 1.1394 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5979 data: 0.0948 lr: 1.25e-05 mem: 47% pow: 650.905 W 0: INFO 26-04-30 02:06:56.467123 - 10:31:37 - step: 41600 acc: 0 loss: 1.4715 grad: 1.58e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6086 data: 0.0853 lr: 1.25e-05 mem: 47% pow: 657.631 W 0: INFO 26-04-30 02:07:13.200698 - 10:31:53 - step: 41610 acc: 0 loss: 1.3033 grad: 1.61e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.5819 data: 0.0908 lr: 1.25e-05 mem: 54% pow: 660.887 W 0: INFO 26-04-30 02:07:26.938036 - 10:32:07 - step: 41620 acc: 0 loss: 1.3491 grad: 1.62e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6077 data: 0.0694 lr: 1.25e-05 mem: 47% pow: 663.628 W 0: INFO 26-04-30 02:07:40.925172 - 10:32:21 - step: 41630 acc: 0 loss: 1.2826 grad: 1.56e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5997 data: 0.0921 lr: 1.25e-05 mem: 47% pow: 649.6 W 0: INFO 26-04-30 02:07:54.550396 - 10:32:35 - step: 41640 acc: 0 loss: 1.3049 grad: 1.68e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6396 data: 0.0761 lr: 1.24e-05 mem: 47% pow: 639.697 W 0: INFO 26-04-30 02:08:08.217653 - 10:32:49 - step: 41650 acc: 0 loss: 1.1503 grad: 1.55e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5866 data: 0.0907 lr: 1.24e-05 mem: 47% pow: 654.656 W 0: INFO 26-04-30 02:08:22.084211 - 10:33:02 - step: 41660 acc: 0 loss: 1.3853 grad: 1.59e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6304 data: 0.0795 lr: 1.24e-05 mem: 47% pow: 645.988 W 0: INFO 26-04-30 02:08:35.802321 - 10:33:16 - step: 41670 acc: 0 loss: 1.1846 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5869 data: 0.0967 lr: 1.24e-05 mem: 47% pow: 660.537 W 0: INFO 26-04-30 02:08:49.535007 - 10:33:30 - step: 41680 acc: 0 loss: 1.1693 grad: 1.56e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.5994 data: 0.091 lr: 1.24e-05 mem: 47% pow: 663.141 W 0: INFO 26-04-30 02:09:03.037217 - 10:33:43 - step: 41690 acc: 0 loss: 1.7105 grad: 1.48e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.611 data: 0.0866 lr: 1.24e-05 mem: 47% pow: 647.247 W 0: INFO 26-04-30 02:09:16.670520 - 10:33:57 - step: 41700 acc: 0 loss: 1.3475 grad: 1.53e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6 data: 0.092 lr: 1.24e-05 mem: 47% pow: 658.464 W 0: INFO 26-04-30 02:09:33.074003 - 10:34:13 - step: 41710 acc: 0 loss: 1.138 grad: 1.59e-01 flops: 3.44e+14 wps: 4.00e+04 iter: 0.5879 data: 0.0867 lr: 1.23e-05 mem: 54% pow: 668.467 W 0: INFO 26-04-30 02:09:46.657745 - 10:34:27 - step: 41720 acc: 0 loss: 1.3659 grad: 1.58e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5897 data: 0.0912 lr: 1.23e-05 mem: 47% pow: 652.009 W 0: INFO 26-04-30 02:10:00.075060 - 10:34:40 - step: 41730 acc: 0 loss: 1.3618 grad: 1.60e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5911 data: 0.0922 lr: 1.23e-05 mem: 47% pow: 661.043 W 0: INFO 26-04-30 02:10:13.552371 - 10:34:54 - step: 41740 acc: 0 loss: 1.4418 grad: 1.62e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5824 data: 0.0941 lr: 1.23e-05 mem: 47% pow: 657.553 W 0: INFO 26-04-30 02:10:26.986349 - 10:35:07 - step: 41750 acc: 0 loss: 1.3237 grad: 1.49e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5879 data: 0.0844 lr: 1.23e-05 mem: 47% pow: 668.491 W 0: INFO 26-04-30 02:10:40.445390 - 10:35:21 - step: 41760 acc: 0 loss: 1.8112 grad: 1.52e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.593 data: 0.0919 lr: 1.23e-05 mem: 47% pow: 670.503 W 0: INFO 26-04-30 02:10:54.204550 - 10:35:35 - step: 41770 acc: 0 loss: 1.0244 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6679 data: 0.075 lr: 1.22e-05 mem: 47% pow: 627.613 W 0: INFO 26-04-30 02:11:07.728526 - 10:35:48 - step: 41780 acc: 0 loss: 1.5909 grad: 1.70e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5874 data: 0.0847 lr: 1.22e-05 mem: 47% pow: 664.152 W 0: INFO 26-04-30 02:11:21.377046 - 10:36:02 - step: 41790 acc: 0 loss: 1.2349 grad: 1.53e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.595 data: 0.0956 lr: 1.22e-05 mem: 47% pow: 659.708 W 0: INFO 26-04-30 02:11:35.027501 - 10:36:15 - step: 41800 acc: 0 loss: 1.3267 grad: 1.55e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6504 data: 0.0528 lr: 1.22e-05 mem: 47% pow: 646.491 W 0: INFO 26-04-30 02:11:51.684257 - 10:36:32 - step: 41810 acc: 0 loss: 1.2799 grad: 1.55e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.5886 data: 0.0987 lr: 1.22e-05 mem: 54% pow: 661.449 W 0: INFO 26-04-30 02:12:05.041549 - 10:36:45 - step: 41820 acc: 0 loss: 1.2885 grad: 1.58e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.6089 data: 0.0866 lr: 1.22e-05 mem: 47% pow: 650.448 W 0: INFO 26-04-30 02:12:18.550072 - 10:36:59 - step: 41830 acc: 0 loss: 1.1546 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6158 data: 0.0958 lr: 1.22e-05 mem: 47% pow: 645.493 W 0: INFO 26-04-30 02:12:32.305922 - 10:37:13 - step: 41840 acc: 0 loss: 1.3526 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6234 data: 0.0892 lr: 1.21e-05 mem: 47% pow: 651.899 W 0: INFO 26-04-30 02:12:45.757396 - 10:37:26 - step: 41850 acc: 0 loss: 1.4905 grad: 1.71e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6097 data: 0.0851 lr: 1.21e-05 mem: 47% pow: 652.566 W 0: INFO 26-04-30 02:12:59.377860 - 10:37:40 - step: 41860 acc: 0 loss: 1.2789 grad: 1.54e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6258 data: 0.0933 lr: 1.21e-05 mem: 47% pow: 641.643 W 0: INFO 26-04-30 02:13:12.857068 - 10:37:53 - step: 41870 acc: 0 loss: 1.327 grad: 1.68e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.592 data: 0.09 lr: 1.21e-05 mem: 47% pow: 667.997 W 0: INFO 26-04-30 02:13:26.439918 - 10:38:07 - step: 41880 acc: 0 loss: 1.343 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5829 data: 0.0959 lr: 1.21e-05 mem: 47% pow: 668.701 W 0: INFO 26-04-30 02:13:40.194365 - 10:38:20 - step: 41890 acc: 0 loss: 1.2228 grad: 1.55e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6315 data: 0.0836 lr: 1.21e-05 mem: 47% pow: 642.246 W 0: INFO 26-04-30 02:13:53.756257 - 10:38:34 - step: 41900 acc: 0 loss: 1.2258 grad: 1.54e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6054 data: 0.0715 lr: 1.21e-05 mem: 47% pow: 660.257 W 0: INFO 26-04-30 02:14:10.292588 - 10:38:51 - step: 41910 acc: 0 loss: 1.4584 grad: 1.57e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6258 data: 0.0867 lr: 1.20e-05 mem: 54% pow: 642.719 W 0: INFO 26-04-30 02:14:23.878041 - 10:39:04 - step: 41920 acc: 0 loss: 1.4422 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6314 data: 0.0679 lr: 1.20e-05 mem: 47% pow: 653.819 W 0: INFO 26-04-30 02:14:37.713610 - 10:39:18 - step: 41930 acc: 0 loss: 1.6799 grad: 1.59e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6123 data: 0.0817 lr: 1.20e-05 mem: 47% pow: 646.767 W 0: INFO 26-04-30 02:14:51.143426 - 10:39:31 - step: 41940 acc: 0 loss: 1.5252 grad: 1.65e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5976 data: 0.0851 lr: 1.20e-05 mem: 47% pow: 658.198 W 0: INFO 26-04-30 02:15:04.642666 - 10:39:45 - step: 41950 acc: 0 loss: 1.2142 grad: 1.67e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6679 data: 0.0506 lr: 1.20e-05 mem: 47% pow: 630.621 W 0: INFO 26-04-30 02:15:18.323049 - 10:39:59 - step: 41960 acc: 0 loss: 1.1121 grad: 1.57e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.604 data: 0.0808 lr: 1.20e-05 mem: 47% pow: 661.813 W 0: INFO 26-04-30 02:15:31.835433 - 10:40:12 - step: 41970 acc: 0 loss: 1.3034 grad: 1.49e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5797 data: 0.1132 lr: 1.20e-05 mem: 47% pow: 652.98 W 0: INFO 26-04-30 02:15:45.271378 - 10:40:26 - step: 41980 acc: 0 loss: 1.2384 grad: 1.54e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5878 data: 0.0877 lr: 1.19e-05 mem: 47% pow: 667.029 W 0: INFO 26-04-30 02:15:58.797114 - 10:40:39 - step: 41990 acc: 0 loss: 1.364 grad: 1.55e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5902 data: 0.0903 lr: 1.19e-05 mem: 47% pow: 659.286 W 0: INFO 26-04-30 02:16:12.135737 - 10:40:52 - step: 42000 acc: 0 loss: 1.2756 grad: 1.60e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.5961 data: 0.0845 lr: 1.19e-05 mem: 47% pow: 658.498 W 0: INFO 26-04-30 02:16:15.839481 - 10:40:56 - garbage collection 0: INFO 26-04-30 02:16:30.251334 - 10:41:11 - step: 42010 acc: 0 loss: 1.1003 grad: 1.51e-01 flops: 3.12e+14 wps: 3.62e+04 iter: 0.6015 data: 0.0911 lr: 1.19e-05 mem: 54% pow: 645.959 W 0: INFO 26-04-30 02:16:43.749739 - 10:41:24 - step: 42020 acc: 0 loss: 1.4672 grad: 1.50e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6033 data: 0.0895 lr: 1.19e-05 mem: 47% pow: 649.211 W 0: INFO 26-04-30 02:16:57.140058 - 10:41:37 - step: 42030 acc: 0 loss: 1.5827 grad: 1.64e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.599 data: 0.0754 lr: 1.19e-05 mem: 47% pow: 661.285 W 0: INFO 26-04-30 02:17:10.654191 - 10:41:51 - step: 42040 acc: 0 loss: 1.3182 grad: 1.63e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6266 data: 0.0681 lr: 1.18e-05 mem: 47% pow: 643.43 W 0: INFO 26-04-30 02:17:24.350261 - 10:42:05 - step: 42050 acc: 0 loss: 1.1822 grad: 1.67e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6074 data: 0.088 lr: 1.18e-05 mem: 47% pow: 643.574 W 0: INFO 26-04-30 02:17:37.883142 - 10:42:18 - step: 42060 acc: 0 loss: 1.2627 grad: 1.62e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5872 data: 0.0951 lr: 1.18e-05 mem: 47% pow: 655.146 W 0: INFO 26-04-30 02:17:51.519032 - 10:42:32 - step: 42070 acc: 0 loss: 1.4978 grad: 1.57e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.601 data: 0.0839 lr: 1.18e-05 mem: 47% pow: 657.427 W 0: INFO 26-04-30 02:18:04.901778 - 10:42:45 - step: 42080 acc: 0 loss: 1.0917 grad: 1.55e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.6128 data: 0.0906 lr: 1.18e-05 mem: 47% pow: 643.875 W 0: INFO 26-04-30 02:18:18.432641 - 10:42:59 - step: 42090 acc: 0 loss: 1.4028 grad: 1.77e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5846 data: 0.0933 lr: 1.18e-05 mem: 47% pow: 658.52 W 0: INFO 26-04-30 02:18:32.153064 - 10:43:12 - step: 42100 acc: 0 loss: 1.1736 grad: 1.58e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6002 data: 0.0869 lr: 1.18e-05 mem: 47% pow: 666.087 W 0: INFO 26-04-30 02:18:48.618318 - 10:43:29 - step: 42110 acc: 0 loss: 1.1515 grad: 1.62e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5893 data: 0.0926 lr: 1.17e-05 mem: 54% pow: 662.744 W 0: INFO 26-04-30 02:19:02.164379 - 10:43:42 - step: 42120 acc: 0 loss: 1.1943 grad: 1.60e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.596 data: 0.0884 lr: 1.17e-05 mem: 47% pow: 667.123 W 0: INFO 26-04-30 02:19:15.609498 - 10:43:56 - step: 42130 acc: 0 loss: 1.2459 grad: 1.55e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5789 data: 0.0894 lr: 1.17e-05 mem: 47% pow: 680.464 W 0: INFO 26-04-30 02:19:29.119083 - 10:44:09 - step: 42140 acc: 0 loss: 1.2621 grad: 1.66e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5908 data: 0.0933 lr: 1.17e-05 mem: 47% pow: 659.666 W 0: INFO 26-04-30 02:19:42.571601 - 10:44:23 - step: 42150 acc: 0 loss: 1.3937 grad: 1.56e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6641 data: 0.0091 lr: 1.17e-05 mem: 47% pow: 670.583 W 0: INFO 26-04-30 02:19:56.130433 - 10:44:36 - step: 42160 acc: 0 loss: 1.4712 grad: 1.52e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.6375 data: 0.0909 lr: 1.17e-05 mem: 47% pow: 633.016 W 0: INFO 26-04-30 02:20:09.871625 - 10:44:50 - step: 42170 acc: 0 loss: 1.2256 grad: 1.76e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6016 data: 0.0871 lr: 1.17e-05 mem: 47% pow: 659.825 W 0: INFO 26-04-30 02:20:23.399337 - 10:45:04 - step: 42180 acc: 0 loss: 1.3181 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5906 data: 0.0934 lr: 1.16e-05 mem: 47% pow: 656.447 W 0: INFO 26-04-30 02:20:36.919236 - 10:45:17 - step: 42190 acc: 0 loss: 1.2855 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5932 data: 0.0845 lr: 1.16e-05 mem: 47% pow: 659.829 W 0: INFO 26-04-30 02:20:50.750639 - 10:45:31 - step: 42200 acc: 0 loss: 1.1484 grad: 1.52e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7918 data: 0.1021 lr: 1.16e-05 mem: 47% pow: 550.159 W 0: INFO 26-04-30 02:21:07.367638 - 10:45:48 - step: 42210 acc: 0 loss: 1.3247 grad: 1.54e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.7255 data: 0.0807 lr: 1.16e-05 mem: 54% pow: 596.452 W 0: INFO 26-04-30 02:21:20.834406 - 10:46:01 - step: 42220 acc: 0 loss: 1.3584 grad: 1.58e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6136 data: 0.0814 lr: 1.16e-05 mem: 47% pow: 649.184 W 0: INFO 26-04-30 02:21:34.434036 - 10:46:15 - step: 42230 acc: 0 loss: 1.1833 grad: 1.66e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6024 data: 0.0892 lr: 1.16e-05 mem: 47% pow: 658.437 W 0: INFO 26-04-30 02:21:48.050416 - 10:46:28 - step: 42240 acc: 0 loss: 1.1467 grad: 1.64e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6001 data: 0.0857 lr: 1.15e-05 mem: 47% pow: 661.716 W 0: INFO 26-04-30 02:22:01.689896 - 10:46:42 - step: 42250 acc: 0 loss: 1.2479 grad: 1.55e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6038 data: 0.0837 lr: 1.15e-05 mem: 47% pow: 662.558 W 0: INFO 26-04-30 02:22:15.400049 - 10:46:56 - step: 42260 acc: 0 loss: 1.2391 grad: 1.61e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5849 data: 0.0935 lr: 1.15e-05 mem: 47% pow: 661.214 W 0: INFO 26-04-30 02:22:29.050431 - 10:47:09 - step: 42270 acc: 0 loss: 0.9264 grad: 1.51e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5871 data: 0.0862 lr: 1.15e-05 mem: 47% pow: 663.334 W 0: INFO 26-04-30 02:22:42.497564 - 10:47:23 - step: 42280 acc: 0 loss: 1.3136 grad: 1.54e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5872 data: 0.0889 lr: 1.15e-05 mem: 47% pow: 667.66 W 0: INFO 26-04-30 02:22:56.074345 - 10:47:36 - step: 42290 acc: 0 loss: 1.1145 grad: 1.58e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6092 data: 0.087 lr: 1.15e-05 mem: 47% pow: 650.201 W 0: INFO 26-04-30 02:23:09.603870 - 10:47:50 - step: 42300 acc: 0 loss: 1.3039 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5971 data: 0.0872 lr: 1.15e-05 mem: 47% pow: 665.506 W 0: INFO 26-04-30 02:23:26.059028 - 10:48:06 - step: 42310 acc: 0 loss: 1.1665 grad: 1.52e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5816 data: 0.0945 lr: 1.14e-05 mem: 54% pow: 661.432 W 0: INFO 26-04-30 02:23:39.457829 - 10:48:20 - step: 42320 acc: 0 loss: 1.3931 grad: 1.64e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.587 data: 0.0926 lr: 1.14e-05 mem: 47% pow: 660.633 W 0: INFO 26-04-30 02:23:52.958424 - 10:48:33 - step: 42330 acc: 0 loss: 1.6273 grad: 1.67e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6128 data: 0.0811 lr: 1.14e-05 mem: 47% pow: 656.446 W 0: INFO 26-04-30 02:24:06.529890 - 10:48:47 - step: 42340 acc: 0 loss: 1.6637 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5811 data: 0.0904 lr: 1.14e-05 mem: 47% pow: 670.397 W 0: INFO 26-04-30 02:24:20.033971 - 10:49:00 - step: 42350 acc: 0 loss: 1.236 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.603 data: 0.0934 lr: 1.14e-05 mem: 47% pow: 657.563 W 0: INFO 26-04-30 02:24:33.446638 - 10:49:14 - step: 42360 acc: 0 loss: 1.4967 grad: 1.56e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5881 data: 0.0838 lr: 1.14e-05 mem: 47% pow: 674.365 W 0: INFO 26-04-30 02:24:46.909333 - 10:49:27 - step: 42370 acc: 0 loss: 1.5117 grad: 1.59e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6061 data: 0.0825 lr: 1.14e-05 mem: 47% pow: 660.308 W 0: INFO 26-04-30 02:25:00.377994 - 10:49:41 - step: 42380 acc: 0 loss: 1.3371 grad: 1.54e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5978 data: 0.0839 lr: 1.13e-05 mem: 47% pow: 657.378 W 0: INFO 26-04-30 02:25:13.745894 - 10:49:54 - step: 42390 acc: 0 loss: 1.2632 grad: 1.59e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.5942 data: 0.0892 lr: 1.13e-05 mem: 47% pow: 662.376 W 0: INFO 26-04-30 02:25:27.577650 - 10:50:08 - step: 42400 acc: 0 loss: 1.0255 grad: 1.56e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5896 data: 0.0922 lr: 1.13e-05 mem: 47% pow: 687.415 W 0: INFO 26-04-30 02:25:43.999480 - 10:50:24 - step: 42410 acc: 0 loss: 1.2361 grad: 1.63e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.5988 data: 0.0826 lr: 1.13e-05 mem: 54% pow: 654.996 W 0: INFO 26-04-30 02:25:57.376340 - 10:50:38 - step: 42420 acc: 0 loss: 1.3876 grad: 1.63e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5943 data: 0.0983 lr: 1.13e-05 mem: 47% pow: 656.35 W 0: INFO 26-04-30 02:26:10.924004 - 10:50:51 - step: 42430 acc: 0 loss: 1.2173 grad: 1.57e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6098 data: 0.0949 lr: 1.13e-05 mem: 47% pow: 649.299 W 0: INFO 26-04-30 02:26:24.425748 - 10:51:05 - step: 42440 acc: 0 loss: 1.1312 grad: 1.61e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6013 data: 0.0845 lr: 1.13e-05 mem: 47% pow: 660.582 W 0: INFO 26-04-30 02:26:37.993474 - 10:51:18 - step: 42450 acc: 0 loss: 1.1306 grad: 1.72e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5881 data: 0.0876 lr: 1.12e-05 mem: 47% pow: 660.42 W 0: INFO 26-04-30 02:26:51.684259 - 10:51:32 - step: 42460 acc: 0 loss: 1.4594 grad: 1.51e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5979 data: 0.0766 lr: 1.12e-05 mem: 47% pow: 666.999 W 0: INFO 26-04-30 02:27:05.363203 - 10:51:46 - step: 42470 acc: 0 loss: 0.9442 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.587 data: 0.0927 lr: 1.12e-05 mem: 47% pow: 655.673 W 0: INFO 26-04-30 02:27:18.967351 - 10:51:59 - step: 42480 acc: 0 loss: 1.2457 grad: 1.60e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5986 data: 0.0848 lr: 1.12e-05 mem: 47% pow: 657.033 W 0: INFO 26-04-30 02:27:32.413524 - 10:52:13 - step: 42490 acc: 0 loss: 1.1851 grad: 1.65e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5856 data: 0.0893 lr: 1.12e-05 mem: 47% pow: 663.677 W 0: INFO 26-04-30 02:27:46.207293 - 10:52:27 - step: 42500 acc: 0 loss: 1.4356 grad: 1.60e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6017 data: 0.087 lr: 1.12e-05 mem: 47% pow: 665.208 W 0: INFO 26-04-30 02:28:02.559635 - 10:52:43 - step: 42510 acc: 0 loss: 1.5081 grad: 1.56e-01 flops: 3.46e+14 wps: 4.01e+04 iter: 0.5904 data: 0.086 lr: 1.11e-05 mem: 54% pow: 655.37 W 0: INFO 26-04-30 02:28:16.064696 - 10:52:56 - step: 42520 acc: 0 loss: 1.2158 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.598 data: 0.0874 lr: 1.11e-05 mem: 47% pow: 665.932 W 0: INFO 26-04-30 02:28:29.612411 - 10:53:10 - step: 42530 acc: 0 loss: 1.3582 grad: 1.75e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5796 data: 0.0934 lr: 1.11e-05 mem: 47% pow: 673.068 W 0: INFO 26-04-30 02:28:43.144860 - 10:53:23 - step: 42540 acc: 0 loss: 1.0465 grad: 1.53e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6188 data: 0.0645 lr: 1.11e-05 mem: 47% pow: 661.666 W 0: INFO 26-04-30 02:28:56.733294 - 10:53:37 - step: 42550 acc: 0 loss: 1.2819 grad: 1.58e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6108 data: 0.0635 lr: 1.11e-05 mem: 47% pow: 667.449 W 0: INFO 26-04-30 02:29:10.165419 - 10:53:50 - step: 42560 acc: 0 loss: 1.4202 grad: 1.65e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5848 data: 0.1006 lr: 1.11e-05 mem: 47% pow: 662.263 W 0: INFO 26-04-30 02:29:23.775878 - 10:54:04 - step: 42570 acc: 0 loss: 1.2858 grad: 1.58e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5907 data: 0.0845 lr: 1.11e-05 mem: 47% pow: 664.215 W 0: INFO 26-04-30 02:29:37.415607 - 10:54:18 - step: 42580 acc: 0 loss: 1.1992 grad: 1.62e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6639 data: 0.0914 lr: 1.10e-05 mem: 47% pow: 616.326 W 0: INFO 26-04-30 02:29:51.777971 - 10:54:32 - step: 42590 acc: 0 loss: 1.051 grad: 1.70e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6081 data: 0.0705 lr: 1.10e-05 mem: 47% pow: 661.719 W 0: INFO 26-04-30 02:30:05.361467 - 10:54:46 - step: 42600 acc: 0 loss: 1.305 grad: 1.60e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5781 data: 0.0975 lr: 1.10e-05 mem: 47% pow: 665.49 W 0: INFO 26-04-30 02:30:21.820864 - 10:55:02 - step: 42610 acc: 0 loss: 1.3448 grad: 1.59e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5936 data: 0.0835 lr: 1.10e-05 mem: 54% pow: 663.876 W 0: INFO 26-04-30 02:30:35.363540 - 10:55:16 - step: 42620 acc: 0 loss: 1.3009 grad: 1.59e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6076 data: 0.0937 lr: 1.10e-05 mem: 47% pow: 644.628 W 0: INFO 26-04-30 02:30:48.982215 - 10:55:29 - step: 42630 acc: 0 loss: 1.0905 grad: 1.56e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6303 data: 0.0743 lr: 1.10e-05 mem: 47% pow: 657.343 W 0: INFO 26-04-30 02:31:02.597549 - 10:55:43 - step: 42640 acc: 0 loss: 1.4506 grad: 1.59e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6148 data: 0.0919 lr: 1.10e-05 mem: 47% pow: 632.805 W 0: INFO 26-04-30 02:31:16.122680 - 10:55:56 - step: 42650 acc: 0 loss: 1.3684 grad: 1.57e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.596 data: 0.0876 lr: 1.09e-05 mem: 47% pow: 666.366 W 0: INFO 26-04-30 02:31:29.606878 - 10:56:10 - step: 42660 acc: 0 loss: 1.1403 grad: 1.53e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5952 data: 0.0864 lr: 1.09e-05 mem: 47% pow: 662.974 W 0: INFO 26-04-30 02:31:43.253375 - 10:56:24 - step: 42670 acc: 0 loss: 1.2857 grad: 1.56e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5944 data: 0.0874 lr: 1.09e-05 mem: 47% pow: 658.013 W 0: INFO 26-04-30 02:31:56.783436 - 10:56:37 - step: 42680 acc: 0 loss: 1.3963 grad: 1.70e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5837 data: 0.1344 lr: 1.09e-05 mem: 47% pow: 632.596 W 0: INFO 26-04-30 02:32:10.496512 - 10:56:51 - step: 42690 acc: 0 loss: 1.1941 grad: 1.61e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5964 data: 0.0937 lr: 1.09e-05 mem: 47% pow: 669.237 W 0: INFO 26-04-30 02:32:23.920820 - 10:57:04 - step: 42700 acc: 0 loss: 1.4404 grad: 1.59e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.584 data: 0.0978 lr: 1.09e-05 mem: 47% pow: 658.86 W 0: INFO 26-04-30 02:32:40.386224 - 10:57:21 - step: 42710 acc: 0 loss: 1.0799 grad: 1.58e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.651 data: 0.0923 lr: 1.08e-05 mem: 54% pow: 627.21 W 0: INFO 26-04-30 02:32:53.802999 - 10:57:34 - step: 42720 acc: 0 loss: 1.2216 grad: 1.64e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5953 data: 0.088 lr: 1.08e-05 mem: 47% pow: 660.802 W 0: INFO 26-04-30 02:33:07.429502 - 10:57:48 - step: 42730 acc: 0 loss: 1.2072 grad: 1.53e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5842 data: 0.084 lr: 1.08e-05 mem: 47% pow: 675.565 W 0: INFO 26-04-30 02:33:21.020219 - 10:58:01 - step: 42740 acc: 0 loss: 1.1672 grad: 1.51e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6077 data: 0.0917 lr: 1.08e-05 mem: 47% pow: 651.305 W 0: INFO 26-04-30 02:33:34.442004 - 10:58:15 - step: 42750 acc: 0 loss: 1.6209 grad: 1.62e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5993 data: 0.0916 lr: 1.08e-05 mem: 47% pow: 662.571 W 0: INFO 26-04-30 02:33:47.997540 - 10:58:28 - step: 42760 acc: 0 loss: 1.196 grad: 1.55e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.7126 data: 0.0771 lr: 1.08e-05 mem: 47% pow: 610.683 W 0: INFO 26-04-30 02:34:01.429888 - 10:58:42 - step: 42770 acc: 0 loss: 1.4097 grad: 1.54e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.6039 data: 0.0841 lr: 1.08e-05 mem: 47% pow: 661.191 W 0: INFO 26-04-30 02:34:14.869158 - 10:58:55 - step: 42780 acc: 0 loss: 1.2138 grad: 1.51e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5952 data: 0.0839 lr: 1.07e-05 mem: 47% pow: 657.028 W 0: INFO 26-04-30 02:34:28.396424 - 10:59:09 - step: 42790 acc: 0 loss: 1.302 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6024 data: 0.089 lr: 1.07e-05 mem: 47% pow: 658.435 W 0: INFO 26-04-30 02:34:42.027304 - 10:59:22 - step: 42800 acc: 0 loss: 1.2588 grad: 1.57e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.706 data: 0.0909 lr: 1.07e-05 mem: 47% pow: 593.648 W 0: INFO 26-04-30 02:34:58.520537 - 10:59:39 - step: 42810 acc: 0 loss: 1.5316 grad: 1.56e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.5928 data: 0.086 lr: 1.07e-05 mem: 54% pow: 658.358 W 0: INFO 26-04-30 02:35:11.931829 - 10:59:52 - step: 42820 acc: 0 loss: 1.4118 grad: 1.61e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6005 data: 0.0811 lr: 1.07e-05 mem: 47% pow: 658.676 W 0: INFO 26-04-30 02:35:25.607595 - 11:00:06 - step: 42830 acc: 0 loss: 1.1394 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5919 data: 0.0919 lr: 1.07e-05 mem: 47% pow: 668.165 W 0: INFO 26-04-30 02:35:39.139120 - 11:00:19 - step: 42840 acc: 0 loss: 0.9226 grad: 1.57e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.5863 data: 0.085 lr: 1.07e-05 mem: 47% pow: 672.827 W 0: INFO 26-04-30 02:35:52.740145 - 11:00:33 - step: 42850 acc: 0 loss: 1.1356 grad: 1.54e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5894 data: 0.0956 lr: 1.06e-05 mem: 47% pow: 665.943 W 0: INFO 26-04-30 02:36:06.096191 - 11:00:46 - step: 42860 acc: 0 loss: 1.2058 grad: 1.59e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.5817 data: 0.1112 lr: 1.06e-05 mem: 47% pow: 654.491 W 0: INFO 26-04-30 02:36:19.666233 - 11:01:00 - step: 42870 acc: 0 loss: 1.2061 grad: 1.57e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5796 data: 0.0968 lr: 1.06e-05 mem: 47% pow: 670.799 W 0: INFO 26-04-30 02:36:33.481096 - 11:01:14 - step: 42880 acc: 0 loss: 1.1075 grad: 1.47e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6073 data: 0.0901 lr: 1.06e-05 mem: 47% pow: 645.727 W 0: INFO 26-04-30 02:36:46.812735 - 11:01:27 - step: 42890 acc: 0 loss: 0.9993 grad: 1.56e-01 flops: 4.24e+14 wps: 4.92e+04 iter: 0.6069 data: 0.0881 lr: 1.06e-05 mem: 47% pow: 655.529 W 0: INFO 26-04-30 02:37:00.488352 - 11:01:41 - step: 42900 acc: 0 loss: 1.3584 grad: 1.54e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6393 data: 0.0836 lr: 1.06e-05 mem: 47% pow: 642.893 W 0: INFO 26-04-30 02:37:16.981394 - 11:01:57 - step: 42910 acc: 0 loss: 1.1147 grad: 1.52e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.5773 data: 0.0976 lr: 1.06e-05 mem: 54% pow: 664.106 W 0: INFO 26-04-30 02:37:30.528038 - 11:02:11 - step: 42920 acc: 0 loss: 1.2374 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6045 data: 0.0965 lr: 1.05e-05 mem: 47% pow: 658.557 W 0: INFO 26-04-30 02:37:43.957132 - 11:02:24 - step: 42930 acc: 0 loss: 1.3225 grad: 1.59e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5915 data: 0.093 lr: 1.05e-05 mem: 47% pow: 664.306 W 0: INFO 26-04-30 02:37:57.396035 - 11:02:38 - step: 42940 acc: 0 loss: 1.3194 grad: 1.54e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5917 data: 0.0878 lr: 1.05e-05 mem: 47% pow: 664.696 W 0: INFO 26-04-30 02:38:11.003751 - 11:02:51 - step: 42950 acc: 0 loss: 1.1272 grad: 1.54e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5811 data: 0.0954 lr: 1.05e-05 mem: 47% pow: 657.484 W 0: INFO 26-04-30 02:38:24.485220 - 11:03:05 - step: 42960 acc: 0 loss: 1.3303 grad: 1.63e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5969 data: 0.0863 lr: 1.05e-05 mem: 47% pow: 662.666 W 0: INFO 26-04-30 02:38:38.312091 - 11:03:19 - step: 42970 acc: 0 loss: 1.1235 grad: 1.54e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6016 data: 0.0842 lr: 1.05e-05 mem: 47% pow: 668.547 W 0: INFO 26-04-30 02:38:51.863592 - 11:03:32 - step: 42980 acc: 0 loss: 1.3039 grad: 1.55e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.605 data: 0.0903 lr: 1.04e-05 mem: 47% pow: 646.137 W 0: INFO 26-04-30 02:39:05.417505 - 11:03:46 - step: 42990 acc: 0 loss: 1.3232 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5822 data: 0.0885 lr: 1.04e-05 mem: 47% pow: 675.83 W 0: INFO 26-04-30 02:39:18.917841 - 11:03:59 - step: 43000 acc: 0 loss: 1.0525 grad: 1.53e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.5912 data: 0.0931 lr: 1.04e-05 mem: 47% pow: 661.555 W 0: INFO 26-04-30 02:39:22.648527 - 11:04:03 - garbage collection 0: INFO 26-04-30 02:39:37.191370 - 11:04:17 - step: 43010 acc: 0 loss: 1.2239 grad: 1.57e-01 flops: 3.09e+14 wps: 3.59e+04 iter: 0.6302 data: 0.0937 lr: 1.04e-05 mem: 54% pow: 636.844 W 0: INFO 26-04-30 02:39:50.814539 - 11:04:31 - step: 43020 acc: 0 loss: 1.2508 grad: 1.56e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5958 data: 0.0844 lr: 1.04e-05 mem: 47% pow: 673.451 W 0: INFO 26-04-30 02:40:04.352304 - 11:04:45 - step: 43030 acc: 0 loss: 1.1361 grad: 1.66e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6058 data: 0.0916 lr: 1.04e-05 mem: 47% pow: 650.578 W 0: INFO 26-04-30 02:40:17.883482 - 11:04:58 - step: 43040 acc: 0 loss: 1.2768 grad: 1.57e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6 data: 0.0923 lr: 1.04e-05 mem: 47% pow: 667.954 W 0: INFO 26-04-30 02:40:31.353832 - 11:05:12 - step: 43050 acc: 0 loss: 1.3379 grad: 1.55e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6047 data: 0.0899 lr: 1.03e-05 mem: 47% pow: 653.276 W 0: INFO 26-04-30 02:40:45.078896 - 11:05:25 - step: 43060 acc: 0 loss: 1.5088 grad: 1.57e-01 flops: 4.11e+14 wps: 4.78e+04 iter: 0.5789 data: 0.0925 lr: 1.03e-05 mem: 47% pow: 665.0 W 0: INFO 26-04-30 02:40:58.554387 - 11:05:39 - step: 43070 acc: 0 loss: 1.1034 grad: 1.89e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.595 data: 0.0863 lr: 1.03e-05 mem: 47% pow: 682.291 W 0: INFO 26-04-30 02:41:12.101846 - 11:05:52 - step: 43080 acc: 0 loss: 1.3875 grad: 1.58e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.596 data: 0.0936 lr: 1.03e-05 mem: 47% pow: 652.102 W 0: INFO 26-04-30 02:41:25.615402 - 11:06:06 - step: 43090 acc: 0 loss: 1.3855 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5962 data: 0.0847 lr: 1.03e-05 mem: 47% pow: 657.237 W 0: INFO 26-04-30 02:41:39.251044 - 11:06:20 - step: 43100 acc: 0 loss: 1.2038 grad: 1.55e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.594 data: 0.0873 lr: 1.03e-05 mem: 47% pow: 659.768 W 0: INFO 26-04-30 02:41:55.733288 - 11:06:36 - step: 43110 acc: 0 loss: 1.1238 grad: 1.58e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5896 data: 0.0934 lr: 1.03e-05 mem: 54% pow: 660.751 W 0: INFO 26-04-30 02:42:09.644514 - 11:06:50 - step: 43120 acc: 0 loss: 1.3312 grad: 1.65e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5996 data: 0.0873 lr: 1.02e-05 mem: 47% pow: 674.018 W 0: INFO 26-04-30 02:42:23.233679 - 11:07:04 - step: 43130 acc: 0 loss: 1.1468 grad: 1.55e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.7306 data: 0.0896 lr: 1.02e-05 mem: 47% pow: 585.364 W 0: INFO 26-04-30 02:42:36.698482 - 11:07:17 - step: 43140 acc: 0 loss: 1.568 grad: 1.51e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5957 data: 0.088 lr: 1.02e-05 mem: 47% pow: 663.641 W 0: INFO 26-04-30 02:42:50.486224 - 11:07:31 - step: 43150 acc: 0 loss: 1.5365 grad: 1.50e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.5866 data: 0.0899 lr: 1.02e-05 mem: 47% pow: 668.72 W 0: INFO 26-04-30 02:43:03.954097 - 11:07:44 - step: 43160 acc: 0 loss: 1.4518 grad: 1.55e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6029 data: 0.0882 lr: 1.02e-05 mem: 47% pow: 659.589 W 0: INFO 26-04-30 02:43:17.462616 - 11:07:58 - step: 43170 acc: 0 loss: 1.3865 grad: 1.64e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.608 data: 0.083 lr: 1.02e-05 mem: 47% pow: 656.767 W 0: INFO 26-04-30 02:43:31.030190 - 11:08:11 - step: 43180 acc: 0 loss: 1.7112 grad: 1.54e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.578 data: 0.0969 lr: 1.01e-05 mem: 47% pow: 674.292 W 0: INFO 26-04-30 02:43:44.734425 - 11:08:25 - step: 43190 acc: 0 loss: 1.2442 grad: 1.55e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.742 data: 0.0983 lr: 1.01e-05 mem: 47% pow: 571.626 W 0: INFO 26-04-30 02:43:58.377519 - 11:08:39 - step: 43200 acc: 0 loss: 1.154 grad: 1.53e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6095 data: 0.0914 lr: 1.01e-05 mem: 47% pow: 645.276 W 0: INFO 26-04-30 02:44:14.657397 - 11:08:55 - step: 43210 acc: 0 loss: 1.0727 grad: 1.56e-01 flops: 3.47e+14 wps: 4.03e+04 iter: 0.5909 data: 0.0912 lr: 1.01e-05 mem: 54% pow: 661.964 W 0: INFO 26-04-30 02:44:28.402143 - 11:09:09 - step: 43220 acc: 0 loss: 1.4921 grad: 1.60e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6022 data: 0.0877 lr: 1.01e-05 mem: 47% pow: 666.415 W 0: INFO 26-04-30 02:44:41.863523 - 11:09:22 - step: 43230 acc: 0 loss: 1.373 grad: 1.62e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5971 data: 0.0838 lr: 1.01e-05 mem: 47% pow: 652.894 W 0: INFO 26-04-30 02:44:55.382799 - 11:09:36 - step: 43240 acc: 0 loss: 1.3637 grad: 1.65e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5977 data: 0.0754 lr: 1.01e-05 mem: 47% pow: 667.925 W 0: INFO 26-04-30 02:45:08.838728 - 11:09:49 - step: 43250 acc: 0 loss: 1.5893 grad: 1.65e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.579 data: 0.091 lr: 1.00e-05 mem: 47% pow: 678.367 W 0: INFO 26-04-30 02:45:22.430179 - 11:10:03 - step: 43260 acc: 0 loss: 1.2531 grad: 1.60e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5845 data: 0.093 lr: 1.00e-05 mem: 47% pow: 656.407 W 0: INFO 26-04-30 02:45:35.780194 - 11:10:16 - step: 43270 acc: 0 loss: 1.4823 grad: 1.74e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.6204 data: 0.0864 lr: 1.00e-05 mem: 47% pow: 646.688 W 0: INFO 26-04-30 02:45:49.393337 - 11:10:30 - step: 43280 acc: 0 loss: 1.5496 grad: 1.63e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6011 data: 0.0852 lr: 1.00e-05 mem: 47% pow: 675.605 W 0: INFO 26-04-30 02:46:02.718538 - 11:10:43 - step: 43290 acc: 0 loss: 1.1486 grad: 1.57e-01 flops: 4.24e+14 wps: 4.92e+04 iter: 0.5798 data: 0.1053 lr: 9.99e-06 mem: 47% pow: 663.247 W 0: INFO 26-04-30 02:46:16.332673 - 11:10:57 - step: 43300 acc: 0 loss: 1.5381 grad: 1.60e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5911 data: 0.0887 lr: 9.97e-06 mem: 47% pow: 660.836 W 0: INFO 26-04-30 02:46:32.772274 - 11:11:13 - step: 43310 acc: 0 loss: 1.2201 grad: 1.60e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.5978 data: 0.0821 lr: 9.96e-06 mem: 54% pow: 661.857 W 0: INFO 26-04-30 02:46:46.211391 - 11:11:27 - step: 43320 acc: 0 loss: 1.1884 grad: 1.55e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5908 data: 0.0915 lr: 9.94e-06 mem: 47% pow: 663.778 W 0: INFO 26-04-30 02:46:59.817457 - 11:11:40 - step: 43330 acc: 0 loss: 1.2374 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6152 data: 0.0879 lr: 9.93e-06 mem: 47% pow: 650.992 W 0: INFO 26-04-30 02:47:13.213081 - 11:11:54 - step: 43340 acc: 0 loss: 1.2679 grad: 1.49e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.5869 data: 0.0916 lr: 9.91e-06 mem: 47% pow: 657.782 W 0: INFO 26-04-30 02:47:26.667226 - 11:12:07 - step: 43350 acc: 0 loss: 1.1168 grad: 1.61e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6176 data: 0.0885 lr: 9.90e-06 mem: 47% pow: 664.201 W 0: INFO 26-04-30 02:47:40.024374 - 11:12:20 - step: 43360 acc: 0 loss: 1.1415 grad: 1.54e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.5902 data: 0.0927 lr: 9.88e-06 mem: 47% pow: 663.582 W 0: INFO 26-04-30 02:47:53.500402 - 11:12:34 - step: 43370 acc: 0 loss: 1.0105 grad: 1.57e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5975 data: 0.0838 lr: 9.87e-06 mem: 47% pow: 657.729 W 0: INFO 26-04-30 02:48:07.053401 - 11:12:47 - step: 43380 acc: 0 loss: 1.3836 grad: 1.51e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5809 data: 0.0932 lr: 9.85e-06 mem: 47% pow: 662.828 W 0: INFO 26-04-30 02:48:20.448750 - 11:13:01 - step: 43390 acc: 0 loss: 1.0549 grad: 1.56e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.603 data: 0.0876 lr: 9.84e-06 mem: 47% pow: 659.819 W 0: INFO 26-04-30 02:48:33.916369 - 11:13:14 - step: 43400 acc: 0 loss: 1.0619 grad: 1.53e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6184 data: 0.0628 lr: 9.82e-06 mem: 47% pow: 673.129 W 0: INFO 26-04-30 02:48:50.636176 - 11:13:31 - step: 43410 acc: 0 loss: 1.5408 grad: 1.60e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.5957 data: 0.0764 lr: 9.81e-06 mem: 54% pow: 669.045 W 0: INFO 26-04-30 02:49:04.206176 - 11:13:45 - step: 43420 acc: 0 loss: 1.4195 grad: 1.54e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5767 data: 0.097 lr: 9.79e-06 mem: 47% pow: 672.298 W 0: INFO 26-04-30 02:49:17.960431 - 11:13:58 - step: 43430 acc: 0 loss: 1.4268 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6105 data: 0.0893 lr: 9.78e-06 mem: 47% pow: 653.673 W 0: INFO 26-04-30 02:49:31.505028 - 11:14:12 - step: 43440 acc: 0 loss: 1.1385 grad: 1.81e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6161 data: 0.0885 lr: 9.76e-06 mem: 47% pow: 660.114 W 0: INFO 26-04-30 02:49:44.963582 - 11:14:25 - step: 43450 acc: 0 loss: 1.1483 grad: 1.63e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5904 data: 0.0919 lr: 9.75e-06 mem: 47% pow: 657.268 W 0: INFO 26-04-30 02:49:58.449040 - 11:14:39 - step: 43460 acc: 0 loss: 1.173 grad: 1.61e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.667 data: 0.0898 lr: 9.73e-06 mem: 47% pow: 609.667 W 0: INFO 26-04-30 02:50:12.036242 - 11:14:52 - step: 43470 acc: 0 loss: 1.0121 grad: 1.69e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6155 data: 0.0962 lr: 9.72e-06 mem: 47% pow: 643.457 W 0: INFO 26-04-30 02:50:25.617331 - 11:15:06 - step: 43480 acc: 0 loss: 0.9581 grad: 1.56e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5928 data: 0.0884 lr: 9.70e-06 mem: 47% pow: 664.616 W 0: INFO 26-04-30 02:50:39.175211 - 11:15:19 - step: 43490 acc: 0 loss: 1.1182 grad: 1.59e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5966 data: 0.0843 lr: 9.69e-06 mem: 47% pow: 655.251 W 0: INFO 26-04-30 02:50:59.078073 - 11:15:39 - step: 43500 acc: 0 loss: 1.3622 grad: 1.54e-01 flops: 2.84e+14 wps: 3.29e+04 iter: 0.5986 data: 0.0768 lr: 9.67e-06 mem: 47% pow: 658.455 W 0: INFO 26-04-30 02:51:15.443661 - 11:15:56 - step: 43510 acc: 0 loss: 1.3224 grad: 1.49e-01 flops: 3.45e+14 wps: 4.01e+04 iter: 0.5859 data: 0.0959 lr: 9.66e-06 mem: 54% pow: 653.081 W 0: INFO 26-04-30 02:51:29.058216 - 11:16:09 - step: 43520 acc: 0 loss: 1.2159 grad: 1.56e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6141 data: 0.0804 lr: 9.64e-06 mem: 47% pow: 645.279 W 0: INFO 26-04-30 02:51:42.770739 - 11:16:23 - step: 43530 acc: 0 loss: 1.3983 grad: 1.47e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5869 data: 0.0892 lr: 9.63e-06 mem: 47% pow: 669.648 W 0: INFO 26-04-30 02:51:56.127327 - 11:16:36 - step: 43540 acc: 0 loss: 1.4899 grad: 1.63e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.6089 data: 0.083 lr: 9.61e-06 mem: 47% pow: 654.612 W 0: INFO 26-04-30 02:52:09.841516 - 11:16:50 - step: 43550 acc: 0 loss: 1.0397 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5944 data: 0.0883 lr: 9.60e-06 mem: 47% pow: 664.73 W 0: INFO 26-04-30 02:52:23.225669 - 11:17:04 - step: 43560 acc: 0 loss: 1.2612 grad: 1.55e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.6191 data: 0.0851 lr: 9.58e-06 mem: 47% pow: 651.0 W 0: INFO 26-04-30 02:52:36.796375 - 11:17:17 - step: 43570 acc: 0 loss: 1.2979 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6053 data: 0.0876 lr: 9.57e-06 mem: 47% pow: 660.345 W 0: INFO 26-04-30 02:52:50.288916 - 11:17:31 - step: 43580 acc: 0 loss: 1.3318 grad: 1.60e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6429 data: 0.0968 lr: 9.55e-06 mem: 47% pow: 650.768 W 0: INFO 26-04-30 02:53:03.705922 - 11:17:44 - step: 43590 acc: 0 loss: 1.0744 grad: 1.57e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5983 data: 0.0847 lr: 9.54e-06 mem: 47% pow: 658.525 W 0: INFO 26-04-30 02:53:17.249734 - 11:17:58 - step: 43600 acc: 0 loss: 1.3534 grad: 1.48e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6116 data: 0.0909 lr: 9.52e-06 mem: 47% pow: 644.055 W 0: INFO 26-04-30 02:53:33.829900 - 11:18:14 - step: 43610 acc: 0 loss: 1.1097 grad: 1.58e-01 flops: 3.41e+14 wps: 3.95e+04 iter: 0.6022 data: 0.0872 lr: 9.51e-06 mem: 54% pow: 658.6 W 0: INFO 26-04-30 02:53:47.246982 - 11:18:28 - step: 43620 acc: 0 loss: 1.1405 grad: 1.54e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5983 data: 0.0921 lr: 9.49e-06 mem: 47% pow: 667.514 W 0: INFO 26-04-30 02:54:00.889152 - 11:18:41 - step: 43630 acc: 0 loss: 1.4288 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5834 data: 0.0892 lr: 9.48e-06 mem: 47% pow: 668.456 W 0: INFO 26-04-30 02:54:14.341185 - 11:18:55 - step: 43640 acc: 0 loss: 1.2152 grad: 1.55e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5862 data: 0.0868 lr: 9.47e-06 mem: 47% pow: 675.493 W 0: INFO 26-04-30 02:54:27.719606 - 11:19:08 - step: 43650 acc: 0 loss: 1.2651 grad: 1.48e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5983 data: 0.0817 lr: 9.45e-06 mem: 47% pow: 664.995 W 0: INFO 26-04-30 02:54:42.576114 - 11:19:23 - step: 43660 acc: 0 loss: 1.3976 grad: 1.54e-01 flops: 3.80e+14 wps: 4.42e+04 iter: 0.6059 data: 0.0792 lr: 9.44e-06 mem: 47% pow: 657.068 W 0: INFO 26-04-30 02:54:56.147423 - 11:19:36 - step: 43670 acc: 0 loss: 1.5694 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.598 data: 0.0835 lr: 9.42e-06 mem: 47% pow: 661.437 W 0: INFO 26-04-30 02:55:09.709746 - 11:19:50 - step: 43680 acc: 0 loss: 1.3879 grad: 1.52e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6036 data: 0.0788 lr: 9.41e-06 mem: 47% pow: 656.093 W 0: INFO 26-04-30 02:55:24.762303 - 11:20:05 - step: 43690 acc: 0 loss: 1.7463 grad: 1.45e-01 flops: 3.75e+14 wps: 4.35e+04 iter: 0.5961 data: 0.0876 lr: 9.39e-06 mem: 47% pow: 659.835 W 0: INFO 26-04-30 02:55:38.393968 - 11:20:19 - step: 43700 acc: 0 loss: 1.156 grad: 1.53e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6278 data: 0.0826 lr: 9.38e-06 mem: 47% pow: 643.527 W 0: INFO 26-04-30 02:55:54.786672 - 11:20:35 - step: 43710 acc: 0 loss: 1.2616 grad: 1.52e-01 flops: 3.45e+14 wps: 4.00e+04 iter: 0.5991 data: 0.0895 lr: 9.36e-06 mem: 54% pow: 658.361 W 0: INFO 26-04-30 02:56:08.303007 - 11:20:49 - step: 43720 acc: 0 loss: 1.1667 grad: 1.52e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6008 data: 0.084 lr: 9.35e-06 mem: 47% pow: 664.59 W 0: INFO 26-04-30 02:56:21.796496 - 11:21:02 - step: 43730 acc: 0 loss: 1.4034 grad: 1.57e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5825 data: 0.0915 lr: 9.33e-06 mem: 47% pow: 664.415 W 0: INFO 26-04-30 02:56:35.265400 - 11:21:16 - step: 43740 acc: 0 loss: 1.3934 grad: 1.62e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5955 data: 0.0909 lr: 9.32e-06 mem: 47% pow: 661.692 W 0: INFO 26-04-30 02:56:48.693684 - 11:21:29 - step: 43750 acc: 0 loss: 1.5945 grad: 1.55e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5962 data: 0.0913 lr: 9.30e-06 mem: 47% pow: 653.623 W 0: INFO 26-04-30 02:57:02.152138 - 11:21:42 - step: 43760 acc: 0 loss: 1.293 grad: 1.56e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.6268 data: 0.0835 lr: 9.29e-06 mem: 47% pow: 643.262 W 0: INFO 26-04-30 02:57:15.431472 - 11:21:56 - step: 43770 acc: 0 loss: 1.4341 grad: 1.53e-01 flops: 4.26e+14 wps: 4.94e+04 iter: 0.5971 data: 0.085 lr: 9.27e-06 mem: 47% pow: 668.025 W 0: INFO 26-04-30 02:57:28.897249 - 11:22:09 - step: 43780 acc: 0 loss: 1.2443 grad: 1.49e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5904 data: 0.087 lr: 9.26e-06 mem: 47% pow: 661.515 W 0: INFO 26-04-30 02:57:42.421006 - 11:22:23 - step: 43790 acc: 0 loss: 1.2721 grad: 1.63e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.613 data: 0.0787 lr: 9.24e-06 mem: 47% pow: 664.036 W 0: INFO 26-04-30 02:57:56.266081 - 11:22:37 - step: 43800 acc: 0 loss: 1.1967 grad: 1.51e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5801 data: 0.0878 lr: 9.23e-06 mem: 47% pow: 675.062 W 0: INFO 26-04-30 02:58:12.885405 - 11:22:53 - step: 43810 acc: 0 loss: 1.3311 grad: 1.54e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6079 data: 0.0955 lr: 9.21e-06 mem: 54% pow: 656.522 W 0: INFO 26-04-30 02:58:26.369261 - 11:23:07 - step: 43820 acc: 0 loss: 0.9633 grad: 1.54e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5877 data: 0.0968 lr: 9.20e-06 mem: 47% pow: 661.316 W 0: INFO 26-04-30 02:58:39.849477 - 11:23:20 - step: 43830 acc: 0 loss: 1.5399 grad: 1.53e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6324 data: 0.0915 lr: 9.18e-06 mem: 47% pow: 644.504 W 0: INFO 26-04-30 02:58:53.520839 - 11:23:34 - step: 43840 acc: 0 loss: 1.2715 grad: 1.58e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6272 data: 0.0704 lr: 9.17e-06 mem: 47% pow: 657.929 W 0: INFO 26-04-30 02:59:06.957734 - 11:23:47 - step: 43850 acc: 0 loss: 1.0603 grad: 1.63e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5814 data: 0.0918 lr: 9.15e-06 mem: 47% pow: 661.079 W 0: INFO 26-04-30 02:59:22.132679 - 11:24:02 - step: 43860 acc: 0 loss: 1.1094 grad: 1.56e-01 flops: 3.72e+14 wps: 4.32e+04 iter: 0.5878 data: 0.091 lr: 9.14e-06 mem: 47% pow: 668.195 W 0: INFO 26-04-30 02:59:36.435158 - 11:24:17 - step: 43870 acc: 0 loss: 1.2245 grad: 1.66e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.6033 data: 0.087 lr: 9.12e-06 mem: 47% pow: 657.347 W 0: INFO 26-04-30 02:59:49.909721 - 11:24:30 - step: 43880 acc: 0 loss: 1.2728 grad: 1.55e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6033 data: 0.0838 lr: 9.11e-06 mem: 47% pow: 659.634 W 0: INFO 26-04-30 03:00:03.675173 - 11:24:44 - step: 43890 acc: 0 loss: 1.4433 grad: 1.45e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6695 data: 0.0801 lr: 9.09e-06 mem: 47% pow: 639.759 W 0: INFO 26-04-30 03:00:17.471432 - 11:24:58 - step: 43900 acc: 0 loss: 1.3476 grad: 1.55e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5808 data: 0.0917 lr: 9.08e-06 mem: 47% pow: 667.631 W 0: INFO 26-04-30 03:00:34.956872 - 11:25:15 - step: 43910 acc: 0 loss: 1.5533 grad: 1.58e-01 flops: 3.23e+14 wps: 3.75e+04 iter: 0.6037 data: 0.0873 lr: 9.06e-06 mem: 54% pow: 660.94 W 0: INFO 26-04-30 03:00:48.572736 - 11:25:29 - step: 43920 acc: 0 loss: 1.1821 grad: 1.47e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.613 data: 0.0911 lr: 9.05e-06 mem: 47% pow: 653.415 W 0: INFO 26-04-30 03:01:02.003305 - 11:25:42 - step: 43930 acc: 0 loss: 1.1351 grad: 1.55e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.591 data: 0.0913 lr: 9.03e-06 mem: 47% pow: 662.429 W 0: INFO 26-04-30 03:01:16.024443 - 11:25:56 - step: 43940 acc: 0 loss: 1.3542 grad: 1.49e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5867 data: 0.0955 lr: 9.02e-06 mem: 47% pow: 657.488 W 0: INFO 26-04-30 03:01:29.451332 - 11:26:10 - step: 43950 acc: 0 loss: 1.3054 grad: 1.53e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5893 data: 0.0926 lr: 9.00e-06 mem: 47% pow: 661.479 W 0: INFO 26-04-30 03:01:43.228560 - 11:26:24 - step: 43960 acc: 0 loss: 1.5749 grad: 1.48e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6361 data: 0.0902 lr: 8.99e-06 mem: 47% pow: 636.787 W 0: INFO 26-04-30 03:01:56.865981 - 11:26:37 - step: 43970 acc: 0 loss: 1.2679 grad: 1.54e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5973 data: 0.0851 lr: 8.97e-06 mem: 47% pow: 658.744 W 0: INFO 26-04-30 03:02:11.140354 - 11:26:51 - step: 43980 acc: 0 loss: 1.4317 grad: 1.49e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.72 data: 0.0943 lr: 8.96e-06 mem: 47% pow: 588.894 W 0: INFO 26-04-30 03:02:24.720392 - 11:27:05 - step: 43990 acc: 0 loss: 1.1799 grad: 1.53e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5936 data: 0.0864 lr: 8.94e-06 mem: 47% pow: 655.833 W 0: INFO 26-04-30 03:02:38.414903 - 11:27:19 - step: 44000 acc: 0 loss: 1.119 grad: 1.59e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5933 data: 0.0889 lr: 8.93e-06 mem: 47% pow: 658.187 W 0: INFO 26-04-30 03:02:42.144275 - 11:27:22 - garbage collection 0: INFO 26-04-30 03:02:57.149617 - 11:27:37 - step: 44010 acc: 0 loss: 1.0593 grad: 1.51e-01 flops: 3.01e+14 wps: 3.50e+04 iter: 0.7962 data: 0.0868 lr: 8.91e-06 mem: 54% pow: 547.985 W 0: INFO 26-04-30 03:03:10.963759 - 11:27:51 - step: 44020 acc: 0 loss: 1.0801 grad: 1.48e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5919 data: 0.09 lr: 8.90e-06 mem: 47% pow: 655.898 W 0: INFO 26-04-30 03:03:24.806602 - 11:28:05 - step: 44030 acc: 0 loss: 1.3773 grad: 1.64e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5955 data: 0.0887 lr: 8.88e-06 mem: 47% pow: 660.114 W 0: INFO 26-04-30 03:03:40.274680 - 11:28:21 - step: 44040 acc: 0 loss: 1.4878 grad: 1.62e-01 flops: 3.65e+14 wps: 4.24e+04 iter: 0.6098 data: 0.0811 lr: 8.87e-06 mem: 47% pow: 656.033 W 0: INFO 26-04-30 03:03:54.107379 - 11:28:34 - step: 44050 acc: 0 loss: 1.4749 grad: 1.45e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6203 data: 0.0846 lr: 8.86e-06 mem: 47% pow: 648.231 W 0: INFO 26-04-30 03:04:08.014078 - 11:28:48 - step: 44060 acc: 0 loss: 1.3958 grad: 1.48e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5814 data: 0.0898 lr: 8.84e-06 mem: 47% pow: 673.246 W 0: INFO 26-04-30 03:04:21.758862 - 11:29:02 - step: 44070 acc: 0 loss: 1.5562 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.8151 data: 0.0962 lr: 8.83e-06 mem: 47% pow: 534.35 W 0: INFO 26-04-30 03:04:36.936247 - 11:29:17 - step: 44080 acc: 0 loss: 1.6235 grad: 1.60e-01 flops: 3.72e+14 wps: 4.32e+04 iter: 0.6041 data: 0.0857 lr: 8.81e-06 mem: 47% pow: 657.459 W 0: INFO 26-04-30 03:04:50.753848 - 11:29:31 - step: 44090 acc: 0 loss: 1.5816 grad: 1.60e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6129 data: 0.0933 lr: 8.80e-06 mem: 47% pow: 658.06 W 0: INFO 26-04-30 03:05:04.551449 - 11:29:45 - step: 44100 acc: 0 loss: 1.5981 grad: 1.44e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6107 data: 0.0925 lr: 8.78e-06 mem: 47% pow: 650.559 W 0: INFO 26-04-30 03:05:21.383559 - 11:30:02 - step: 44110 acc: 0 loss: 1.2679 grad: 1.50e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.5832 data: 0.0908 lr: 8.77e-06 mem: 54% pow: 660.876 W 0: INFO 26-04-30 03:05:35.272553 - 11:30:16 - step: 44120 acc: 0 loss: 1.5236 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6777 data: 0.0886 lr: 8.75e-06 mem: 47% pow: 621.119 W 0: INFO 26-04-30 03:05:48.973811 - 11:30:29 - step: 44130 acc: 0 loss: 1.2654 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6092 data: 0.084 lr: 8.74e-06 mem: 47% pow: 653.686 W 0: INFO 26-04-30 03:06:03.910947 - 11:30:44 - step: 44140 acc: 0 loss: 1.4084 grad: 1.42e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 0.6035 data: 0.0821 lr: 8.72e-06 mem: 47% pow: 664.519 W 0: INFO 26-04-30 03:06:17.608547 - 11:30:58 - step: 44150 acc: 0 loss: 0.8738 grad: 1.52e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.7151 data: 0.0912 lr: 8.71e-06 mem: 47% pow: 595.546 W 0: INFO 26-04-30 03:06:31.929302 - 11:31:12 - step: 44160 acc: 0 loss: 1.4574 grad: 1.46e-01 flops: 3.95e+14 wps: 4.58e+04 iter: 0.5883 data: 0.0932 lr: 8.69e-06 mem: 47% pow: 659.364 W 0: INFO 26-04-30 03:06:45.639797 - 11:31:26 - step: 44170 acc: 0 loss: 1.5474 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6649 data: 0.0846 lr: 8.68e-06 mem: 47% pow: 627.29 W 0: INFO 26-04-30 03:06:59.313201 - 11:31:40 - step: 44180 acc: 0 loss: 1.316 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5791 data: 0.0933 lr: 8.66e-06 mem: 47% pow: 658.671 W 0: INFO 26-04-30 03:07:13.271284 - 11:31:54 - step: 44190 acc: 0 loss: 1.3756 grad: 1.49e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5907 data: 0.0896 lr: 8.65e-06 mem: 47% pow: 672.277 W 0: INFO 26-04-30 03:07:28.205466 - 11:32:09 - step: 44200 acc: 0 loss: 1.3562 grad: 1.46e-01 flops: 3.78e+14 wps: 4.39e+04 iter: 1.5339 data: 0.0892 lr: 8.63e-06 mem: 47% pow: 459.026 W 0: INFO 26-04-30 03:07:44.740392 - 11:32:25 - step: 44210 acc: 0 loss: 1.2681 grad: 1.47e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6198 data: 0.0927 lr: 8.62e-06 mem: 54% pow: 644.795 W 0: INFO 26-04-30 03:07:58.893016 - 11:32:39 - step: 44220 acc: 0 loss: 1.5812 grad: 1.51e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5837 data: 0.0889 lr: 8.60e-06 mem: 47% pow: 659.862 W 0: INFO 26-04-30 03:08:12.621141 - 11:32:53 - step: 44230 acc: 0 loss: 1.3198 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5852 data: 0.0909 lr: 8.59e-06 mem: 47% pow: 668.172 W 0: INFO 26-04-30 03:08:26.751033 - 11:33:07 - step: 44240 acc: 0 loss: 1.3418 grad: 1.45e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.5799 data: 0.0906 lr: 8.57e-06 mem: 47% pow: 674.524 W 0: INFO 26-04-30 03:08:42.018915 - 11:33:22 - step: 44250 acc: 0 loss: 1.1757 grad: 1.48e-01 flops: 3.70e+14 wps: 4.29e+04 iter: 0.7275 data: 0.0877 lr: 8.56e-06 mem: 47% pow: 584.24 W 0: INFO 26-04-30 03:08:55.746840 - 11:33:36 - step: 44260 acc: 0 loss: 1.5698 grad: 1.46e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5932 data: 0.0891 lr: 8.54e-06 mem: 47% pow: 658.741 W 0: INFO 26-04-30 03:09:09.710090 - 11:33:50 - step: 44270 acc: 0 loss: 1.4567 grad: 1.44e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5906 data: 0.094 lr: 8.53e-06 mem: 47% pow: 668.417 W 0: INFO 26-04-30 03:09:23.523374 - 11:34:04 - step: 44280 acc: 0 loss: 0.74 grad: 1.45e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5803 data: 0.0936 lr: 8.51e-06 mem: 47% pow: 655.808 W 0: INFO 26-04-30 03:09:37.706364 - 11:34:18 - step: 44290 acc: 0 loss: 1.3293 grad: 1.45e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.8266 data: 0.0914 lr: 8.50e-06 mem: 47% pow: 527.989 W 0: INFO 26-04-30 03:09:51.649999 - 11:34:32 - step: 44300 acc: 0 loss: 1.5566 grad: 1.48e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6021 data: 0.0831 lr: 8.48e-06 mem: 47% pow: 670.439 W 0: INFO 26-04-30 03:10:09.584669 - 11:34:50 - step: 44310 acc: 0 loss: 1.6463 grad: 1.45e-01 flops: 3.15e+14 wps: 3.66e+04 iter: 0.5903 data: 0.0877 lr: 8.47e-06 mem: 54% pow: 667.297 W 0: INFO 26-04-30 03:10:23.182017 - 11:35:03 - step: 44320 acc: 0 loss: 1.4268 grad: 1.45e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.595 data: 0.0869 lr: 8.45e-06 mem: 47% pow: 652.719 W 0: INFO 26-04-30 03:10:36.876199 - 11:35:17 - step: 44330 acc: 0 loss: 1.387 grad: 1.43e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6814 data: 0.0754 lr: 8.44e-06 mem: 47% pow: 607.599 W 0: INFO 26-04-30 03:10:50.888717 - 11:35:31 - step: 44340 acc: 0 loss: 1.3187 grad: 1.49e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5806 data: 0.0918 lr: 8.42e-06 mem: 47% pow: 671.801 W 0: INFO 26-04-30 03:11:04.672851 - 11:35:45 - step: 44350 acc: 0 loss: 1.5454 grad: 1.56e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6151 data: 0.0841 lr: 8.41e-06 mem: 47% pow: 653.082 W 0: INFO 26-04-30 03:11:21.727808 - 11:36:02 - step: 44360 acc: 0 loss: 1.2377 grad: 1.46e-01 flops: 3.31e+14 wps: 3.84e+04 iter: 0.623 data: 0.0878 lr: 8.39e-06 mem: 47% pow: 646.438 W 0: INFO 26-04-30 03:11:35.252703 - 11:36:16 - step: 44370 acc: 0 loss: 1.1926 grad: 1.44e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6122 data: 0.0763 lr: 8.38e-06 mem: 47% pow: 661.297 W 0: INFO 26-04-30 03:11:49.233163 - 11:36:30 - step: 44380 acc: 0 loss: 1.2234 grad: 1.54e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.72 data: 0.0845 lr: 8.36e-06 mem: 47% pow: 599.431 W 0: INFO 26-04-30 03:12:02.883978 - 11:36:43 - step: 44390 acc: 0 loss: 1.509 grad: 1.47e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5957 data: 0.0859 lr: 8.35e-06 mem: 47% pow: 658.919 W 0: INFO 26-04-30 03:12:16.674405 - 11:36:57 - step: 44400 acc: 0 loss: 1.3455 grad: 1.65e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5929 data: 0.0817 lr: 8.33e-06 mem: 47% pow: 675.307 W 0: INFO 26-04-30 03:12:33.937491 - 11:37:14 - step: 44410 acc: 0 loss: 1.2141 grad: 1.47e-01 flops: 3.27e+14 wps: 3.80e+04 iter: 0.6464 data: 0.0941 lr: 8.32e-06 mem: 54% pow: 625.677 W 0: INFO 26-04-30 03:12:47.645122 - 11:37:28 - step: 44420 acc: 0 loss: 1.2782 grad: 1.43e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6159 data: 0.09 lr: 8.30e-06 mem: 47% pow: 666.493 W 0: INFO 26-04-30 03:13:01.560643 - 11:37:42 - step: 44430 acc: 0 loss: 1.3048 grad: 1.46e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5889 data: 0.0926 lr: 8.29e-06 mem: 47% pow: 659.933 W 0: INFO 26-04-30 03:13:15.626746 - 11:37:56 - step: 44440 acc: 0 loss: 1.4939 grad: 1.47e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.6051 data: 0.0781 lr: 8.27e-06 mem: 47% pow: 656.704 W 0: INFO 26-04-30 03:13:31.405901 - 11:38:12 - step: 44450 acc: 0 loss: 1.129 grad: 1.53e-01 flops: 3.58e+14 wps: 4.15e+04 iter: 0.5854 data: 0.0849 lr: 8.26e-06 mem: 47% pow: 684.637 W 0: INFO 26-04-30 03:13:45.739544 - 11:38:26 - step: 44460 acc: 0 loss: 1.283 grad: 1.42e-01 flops: 3.94e+14 wps: 4.58e+04 iter: 0.5823 data: 0.0942 lr: 8.25e-06 mem: 47% pow: 661.827 W 0: INFO 26-04-30 03:14:00.136368 - 11:38:40 - step: 44470 acc: 0 loss: 1.4111 grad: 1.44e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.5782 data: 0.1581 lr: 8.23e-06 mem: 47% pow: 624.853 W 0: INFO 26-04-30 03:14:14.124552 - 11:38:54 - step: 44480 acc: 0 loss: 1.3779 grad: 1.50e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5894 data: 0.0915 lr: 8.22e-06 mem: 47% pow: 669.277 W 0: INFO 26-04-30 03:14:28.334022 - 11:39:09 - step: 44490 acc: 0 loss: 1.5146 grad: 1.43e-01 flops: 3.98e+14 wps: 4.61e+04 iter: 0.6063 data: 0.0864 lr: 8.20e-06 mem: 47% pow: 649.199 W 0: INFO 26-04-30 03:14:42.210623 - 11:39:23 - step: 44500 acc: 0 loss: 1.5495 grad: 1.43e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.669 data: 0.0828 lr: 8.19e-06 mem: 47% pow: 624.568 W 0: INFO 26-04-30 03:14:58.637956 - 11:39:39 - step: 44510 acc: 0 loss: 1.1291 grad: 1.47e-01 flops: 3.44e+14 wps: 3.99e+04 iter: 0.5887 data: 0.092 lr: 8.17e-06 mem: 54% pow: 660.368 W 0: INFO 26-04-30 03:15:12.620791 - 11:39:53 - step: 44520 acc: 0 loss: 1.4083 grad: 1.52e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5903 data: 0.0928 lr: 8.16e-06 mem: 47% pow: 657.123 W 0: INFO 26-04-30 03:15:26.170520 - 11:40:06 - step: 44530 acc: 0 loss: 1.2699 grad: 1.41e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5882 data: 0.0821 lr: 8.14e-06 mem: 47% pow: 667.28 W 0: INFO 26-04-30 03:15:40.173515 - 11:40:20 - step: 44540 acc: 0 loss: 1.2943 grad: 1.54e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6021 data: 0.087 lr: 8.13e-06 mem: 47% pow: 654.978 W 0: INFO 26-04-30 03:15:53.887330 - 11:40:34 - step: 44550 acc: 0 loss: 1.3341 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5948 data: 0.0934 lr: 8.11e-06 mem: 47% pow: 666.931 W 0: INFO 26-04-30 03:16:07.715109 - 11:40:48 - step: 44560 acc: 0 loss: 1.3365 grad: 1.61e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6287 data: 0.0879 lr: 8.10e-06 mem: 47% pow: 641.913 W 0: INFO 26-04-30 03:16:21.849140 - 11:41:02 - step: 44570 acc: 0 loss: 1.3729 grad: 1.63e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6235 data: 0.0837 lr: 8.08e-06 mem: 47% pow: 656.262 W 0: INFO 26-04-30 03:16:35.997794 - 11:41:16 - step: 44580 acc: 0 loss: 1.2741 grad: 1.49e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.5858 data: 0.087 lr: 8.07e-06 mem: 47% pow: 669.012 W 0: INFO 26-04-30 03:16:53.224954 - 11:41:34 - step: 44590 acc: 0 loss: 1.3256 grad: 1.49e-01 flops: 3.28e+14 wps: 3.80e+04 iter: 0.583 data: 0.0877 lr: 8.05e-06 mem: 47% pow: 671.023 W 0: INFO 26-04-30 03:17:09.168721 - 11:41:49 - step: 44600 acc: 0 loss: 1.5217 grad: 1.48e-01 flops: 3.54e+14 wps: 4.11e+04 iter: 0.5796 data: 0.0926 lr: 8.04e-06 mem: 47% pow: 662.072 W 0: INFO 26-04-30 03:17:25.799786 - 11:42:06 - step: 44610 acc: 0 loss: 1.6699 grad: 1.50e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6406 data: 0.0771 lr: 8.02e-06 mem: 54% pow: 634.604 W 0: INFO 26-04-30 03:17:39.910142 - 11:42:20 - step: 44620 acc: 0 loss: 1.7185 grad: 1.47e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.6203 data: 0.0909 lr: 8.01e-06 mem: 47% pow: 639.64 W 0: INFO 26-04-30 03:17:53.689624 - 11:42:34 - step: 44630 acc: 0 loss: 1.4026 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6307 data: 0.1042 lr: 7.99e-06 mem: 47% pow: 622.742 W 0: INFO 26-04-30 03:18:07.470304 - 11:42:48 - step: 44640 acc: 0 loss: 1.343 grad: 1.49e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6241 data: 0.0851 lr: 7.98e-06 mem: 47% pow: 645.437 W 0: INFO 26-04-30 03:18:21.325660 - 11:43:02 - step: 44650 acc: 0 loss: 1.2733 grad: 1.49e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.7527 data: 0.0947 lr: 7.96e-06 mem: 47% pow: 573.58 W 0: INFO 26-04-30 03:18:35.271976 - 11:43:16 - step: 44660 acc: 0 loss: 1.5139 grad: 1.48e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6513 data: 0.0589 lr: 7.95e-06 mem: 47% pow: 644.789 W 0: INFO 26-04-30 03:18:49.388659 - 11:43:30 - step: 44670 acc: 0 loss: 1.3625 grad: 1.47e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.9196 data: 0.0627 lr: 7.93e-06 mem: 47% pow: 489.182 W 0: INFO 26-04-30 03:19:05.329172 - 11:43:46 - step: 44680 acc: 0 loss: 1.2987 grad: 1.49e-01 flops: 3.54e+14 wps: 4.11e+04 iter: 0.7577 data: 0.0377 lr: 7.92e-06 mem: 47% pow: 593.973 W 0: INFO 26-04-30 03:19:19.575276 - 11:44:00 - step: 44690 acc: 0 loss: 1.6862 grad: 1.44e-01 flops: 3.97e+14 wps: 4.60e+04 iter: 0.6157 data: 0.096 lr: 7.90e-06 mem: 47% pow: 643.861 W 0: INFO 26-04-30 03:19:34.233136 - 11:44:15 - step: 44700 acc: 0 loss: 1.3321 grad: 1.52e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 0.6488 data: 0.0833 lr: 7.89e-06 mem: 47% pow: 630.337 W 0: INFO 26-04-30 03:19:50.772200 - 11:44:31 - step: 44710 acc: 0 loss: 1.4161 grad: 1.49e-01 flops: 3.42e+14 wps: 3.96e+04 iter: 0.6207 data: 0.0981 lr: 7.87e-06 mem: 54% pow: 652.341 W 0: INFO 26-04-30 03:20:04.480294 - 11:44:45 - step: 44720 acc: 0 loss: 1.5657 grad: 1.51e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6229 data: 0.0838 lr: 7.86e-06 mem: 47% pow: 651.57 W 0: INFO 26-04-30 03:20:18.080210 - 11:44:58 - step: 44730 acc: 0 loss: 1.1296 grad: 1.56e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5841 data: 0.0921 lr: 7.84e-06 mem: 47% pow: 665.245 W 0: INFO 26-04-30 03:20:31.732877 - 11:45:12 - step: 44740 acc: 0 loss: 1.3723 grad: 2.15e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6021 data: 0.0892 lr: 7.83e-06 mem: 47% pow: 657.0 W 0: INFO 26-04-30 03:20:48.224607 - 11:45:29 - step: 44750 acc: 0 loss: 1.4613 grad: 1.43e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.6588 data: 0.0855 lr: 7.81e-06 mem: 47% pow: 632.644 W 0: INFO 26-04-30 03:21:02.165463 - 11:45:42 - step: 44760 acc: 0 loss: 1.5224 grad: 1.48e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6626 data: 0.082 lr: 7.80e-06 mem: 47% pow: 629.324 W 0: INFO 26-04-30 03:21:17.173638 - 11:45:57 - step: 44770 acc: 0 loss: 1.332 grad: 1.56e-01 flops: 3.76e+14 wps: 4.37e+04 iter: 1.8713 data: 0.1653 lr: 7.78e-06 mem: 47% pow: 441.012 W 0: INFO 26-04-30 03:21:30.992006 - 11:46:11 - step: 44780 acc: 0 loss: 1.4976 grad: 1.48e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5871 data: 0.0896 lr: 7.77e-06 mem: 47% pow: 668.077 W 0: INFO 26-04-30 03:21:44.700118 - 11:46:25 - step: 44790 acc: 0 loss: 1.4591 grad: 1.44e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5959 data: 0.0863 lr: 7.75e-06 mem: 47% pow: 659.653 W 0: INFO 26-04-30 03:21:58.708148 - 11:46:39 - step: 44800 acc: 0 loss: 1.6948 grad: 1.51e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5787 data: 0.11 lr: 7.74e-06 mem: 47% pow: 658.145 W 0: INFO 26-04-30 03:22:16.021782 - 11:46:56 - step: 44810 acc: 0 loss: 1.5518 grad: 1.98e-01 flops: 3.26e+14 wps: 3.79e+04 iter: 0.5994 data: 0.0873 lr: 7.72e-06 mem: 54% pow: 659.735 W 0: INFO 26-04-30 03:22:30.187894 - 11:47:10 - step: 44820 acc: 0 loss: 1.5786 grad: 1.46e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6191 data: 0.07 lr: 7.71e-06 mem: 47% pow: 666.414 W 0: INFO 26-04-30 03:22:44.093858 - 11:47:24 - step: 44830 acc: 0 loss: 1.2407 grad: 1.46e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6133 data: 0.0794 lr: 7.69e-06 mem: 47% pow: 660.106 W 0: INFO 26-04-30 03:23:02.409602 - 11:47:43 - step: 44840 acc: 0 loss: 1.5122 grad: 1.44e-01 flops: 3.08e+14 wps: 3.58e+04 iter: 0.5933 data: 0.0945 lr: 7.68e-06 mem: 47% pow: 660.183 W 0: INFO 26-04-30 03:23:16.863655 - 11:47:57 - step: 44850 acc: 0 loss: 1.389 grad: 1.47e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6012 data: 0.0839 lr: 7.66e-06 mem: 47% pow: 656.388 W 0: INFO 26-04-30 03:23:32.994712 - 11:48:13 - step: 44860 acc: 0 loss: 1.5256 grad: 1.48e-01 flops: 3.50e+14 wps: 4.07e+04 iter: 0.7316 data: 0.0822 lr: 7.65e-06 mem: 47% pow: 586.697 W 0: INFO 26-04-30 03:23:46.758139 - 11:48:27 - step: 44870 acc: 0 loss: 1.5135 grad: 1.54e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6833 data: 0.0894 lr: 7.63e-06 mem: 47% pow: 621.948 W 0: INFO 26-04-30 03:24:00.713739 - 11:48:41 - step: 44880 acc: 0 loss: 1.6907 grad: 1.44e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6079 data: 0.0838 lr: 7.62e-06 mem: 47% pow: 654.146 W 0: INFO 26-04-30 03:24:14.906770 - 11:48:55 - step: 44890 acc: 0 loss: 1.1991 grad: 1.49e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6069 data: 0.0859 lr: 7.61e-06 mem: 47% pow: 652.955 W 0: INFO 26-04-30 03:24:28.897109 - 11:49:09 - step: 44900 acc: 0 loss: 1.1179 grad: 1.45e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6717 data: 0.0803 lr: 7.59e-06 mem: 47% pow: 629.332 W 0: INFO 26-04-30 03:24:45.826745 - 11:49:26 - step: 44910 acc: 0 loss: 1.3074 grad: 1.46e-01 flops: 3.34e+14 wps: 3.87e+04 iter: 0.579 data: 0.0905 lr: 7.58e-06 mem: 54% pow: 669.735 W 0: INFO 26-04-30 03:25:00.424580 - 11:49:41 - step: 44920 acc: 0 loss: 1.4426 grad: 1.45e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.5816 data: 0.09 lr: 7.56e-06 mem: 47% pow: 678.305 W 0: INFO 26-04-30 03:25:14.605550 - 11:49:55 - step: 44930 acc: 0 loss: 2.1498 grad: 1.47e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.6545 data: 0.0938 lr: 7.55e-06 mem: 47% pow: 624.469 W 0: INFO 26-04-30 03:25:28.434993 - 11:50:09 - step: 44940 acc: 0 loss: 1.6818 grad: 1.45e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6041 data: 0.0911 lr: 7.53e-06 mem: 47% pow: 647.826 W 0: INFO 26-04-30 03:25:42.051716 - 11:50:22 - step: 44950 acc: 0 loss: 1.7855 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5855 data: 0.0888 lr: 7.52e-06 mem: 47% pow: 666.466 W 0: INFO 26-04-30 03:26:02.020005 - 11:50:42 - step: 44960 acc: 0 loss: 1.5203 grad: 1.46e-01 flops: 2.83e+14 wps: 3.28e+04 iter: 0.7104 data: 0.0866 lr: 7.50e-06 mem: 47% pow: 597.378 W 0: INFO 26-04-30 03:26:15.816919 - 11:50:56 - step: 44970 acc: 0 loss: 1.5967 grad: 1.44e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6211 data: 0.0748 lr: 7.49e-06 mem: 47% pow: 649.325 W 0: INFO 26-04-30 03:26:29.566149 - 11:51:10 - step: 44980 acc: 0 loss: 1.4817 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6276 data: 0.0619 lr: 7.47e-06 mem: 47% pow: 660.175 W 0: INFO 26-04-30 03:26:43.487182 - 11:51:24 - step: 44990 acc: 0 loss: 2.0016 grad: 1.45e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6043 data: 0.0865 lr: 7.46e-06 mem: 47% pow: 656.96 W 0: INFO 26-04-30 03:26:57.516945 - 11:51:38 - step: 45000 acc: 0 loss: 1.3711 grad: 1.43e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.7663 data: 0.0965 lr: 7.44e-06 mem: 47% pow: 557.512 W 0: INFO 26-04-30 03:26:57.521632 - 11:51:38 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000045000 0: INFO 26-04-30 03:26:57.522027 - 11:51:38 - Saving... 0: INFO 26-04-30 03:27:03.365071 - 11:51:44 - State dict saved! 0: INFO 26-04-30 03:27:03.441474 - 11:51:44 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000045000/train_state_00000.json 0: INFO 26-04-30 03:27:03.445878 - 11:51:44 - Train state saved ! 0: INFO 26-04-30 03:27:03.446348 - 11:51:44 - Cleaning up checkpoints... 0: INFO 26-04-30 03:27:03.446550 - 11:51:44 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000040000'), PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000045000')] 0: INFO 26-04-30 03:27:03.447251 - 11:51:44 - Eval folders: [] 0: INFO 26-04-30 03:27:03.447406 - 11:51:44 - Other folders: [] 0: INFO 26-04-30 03:27:03.447530 - 11:51:44 - Removing folders: {PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000040000')} 0: INFO 26-04-30 03:27:07.528689 - 11:51:48 - garbage collection 0: INFO 26-04-30 03:27:22.098259 - 11:52:02 - step: 45010 acc: 0 loss: 1.3018 grad: 1.49e-01 flops: 2.30e+14 wps: 2.67e+04 iter: 0.5857 data: 0.0906 lr: 7.43e-06 mem: 54% pow: 667.773 W 0: INFO 26-04-30 03:27:35.989363 - 11:52:16 - step: 45020 acc: 0 loss: 1.76 grad: 1.64e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.7018 data: 0.0841 lr: 7.41e-06 mem: 47% pow: 606.492 W 0: INFO 26-04-30 03:27:49.670068 - 11:52:30 - step: 45030 acc: 0 loss: 1.5936 grad: 1.59e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6208 data: 0.0714 lr: 7.40e-06 mem: 47% pow: 650.252 W 0: INFO 26-04-30 03:28:03.413848 - 11:52:44 - step: 45040 acc: 0 loss: 1.2606 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6074 data: 0.0851 lr: 7.38e-06 mem: 47% pow: 659.208 W 0: INFO 26-04-30 03:28:17.369642 - 11:52:58 - step: 45050 acc: 0 loss: 1.6781 grad: 1.56e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7093 data: 0.0798 lr: 7.37e-06 mem: 47% pow: 606.366 W 0: INFO 26-04-30 03:28:32.041055 - 11:53:12 - step: 45060 acc: 0 loss: 1.319 grad: 1.53e-01 flops: 3.85e+14 wps: 4.47e+04 iter: 1.2565 data: 0.1 lr: 7.35e-06 mem: 47% pow: 418.331 W 0: INFO 26-04-30 03:28:46.629277 - 11:53:27 - step: 45070 acc: 0 loss: 1.479 grad: 1.49e-01 flops: 3.87e+14 wps: 4.49e+04 iter: 0.6457 data: 0.086 lr: 7.34e-06 mem: 47% pow: 634.772 W 0: INFO 26-04-30 03:29:00.331350 - 11:53:41 - step: 45080 acc: 0 loss: 1.4445 grad: 1.55e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.7241 data: 0.0975 lr: 7.32e-06 mem: 47% pow: 587.147 W 0: INFO 26-04-30 03:29:14.313390 - 11:53:55 - step: 45090 acc: 0 loss: 1.3781 grad: 1.58e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.662 data: 0.0679 lr: 7.31e-06 mem: 47% pow: 631.316 W 0: INFO 26-04-30 03:29:28.462485 - 11:54:09 - step: 45100 acc: 0 loss: 1.2322 grad: 1.52e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.8679 data: 0.1171 lr: 7.29e-06 mem: 47% pow: 498.087 W 0: INFO 26-04-30 03:29:46.001279 - 11:54:26 - step: 45110 acc: 0 loss: 1.402 grad: 1.75e-01 flops: 3.22e+14 wps: 3.74e+04 iter: 0.5792 data: 0.0873 lr: 7.28e-06 mem: 54% pow: 680.088 W 0: INFO 26-04-30 03:29:59.492875 - 11:54:40 - step: 45120 acc: 0 loss: 1.3377 grad: 1.52e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5819 data: 0.0934 lr: 7.26e-06 mem: 47% pow: 653.785 W 0: INFO 26-04-30 03:30:13.480336 - 11:54:54 - step: 45130 acc: 0 loss: 1.3048 grad: 1.48e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5914 data: 0.0832 lr: 7.25e-06 mem: 47% pow: 662.668 W 0: INFO 26-04-30 03:30:27.263894 - 11:55:08 - step: 45140 acc: 0 loss: 1.6295 grad: 1.49e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5804 data: 0.0936 lr: 7.23e-06 mem: 47% pow: 670.145 W 0: INFO 26-04-30 03:30:40.973567 - 11:55:21 - step: 45150 acc: 0 loss: 1.2865 grad: 1.66e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6051 data: 0.1247 lr: 7.22e-06 mem: 47% pow: 635.922 W 0: INFO 26-04-30 03:30:54.740896 - 11:55:35 - step: 45160 acc: 0 loss: 1.1785 grad: 1.51e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6088 data: 0.0937 lr: 7.20e-06 mem: 47% pow: 656.666 W 0: INFO 26-04-30 03:31:12.209821 - 11:55:53 - step: 45170 acc: 0 loss: 1.2399 grad: 1.51e-01 flops: 3.23e+14 wps: 3.75e+04 iter: 0.6885 data: 0.0034 lr: 7.19e-06 mem: 47% pow: 654.411 W 0: INFO 26-04-30 03:31:25.910276 - 11:56:06 - step: 45180 acc: 0 loss: 1.5273 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6921 data: 0.0035 lr: 7.17e-06 mem: 47% pow: 652.078 W 0: INFO 26-04-30 03:31:40.049092 - 11:56:20 - step: 45190 acc: 0 loss: 1.4731 grad: 1.51e-01 flops: 3.99e+14 wps: 4.64e+04 iter: 0.6073 data: 0.0833 lr: 7.16e-06 mem: 47% pow: 658.748 W 0: INFO 26-04-30 03:31:53.759928 - 11:56:34 - step: 45200 acc: 0 loss: 1.191 grad: 1.58e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6141 data: 0.0852 lr: 7.14e-06 mem: 47% pow: 651.618 W 0: INFO 26-04-30 03:32:10.438518 - 11:56:51 - step: 45210 acc: 0 loss: 1.6039 grad: 1.61e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.6076 data: 0.0753 lr: 7.13e-06 mem: 54% pow: 671.927 W 0: INFO 26-04-30 03:32:27.644977 - 11:57:08 - step: 45220 acc: 0 loss: 1.5963 grad: 1.48e-01 flops: 3.28e+14 wps: 3.81e+04 iter: 0.5945 data: 0.0945 lr: 7.11e-06 mem: 47% pow: 664.165 W 0: INFO 26-04-30 03:32:41.477517 - 11:57:22 - step: 45230 acc: 0 loss: 1.7332 grad: 1.47e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5981 data: 0.0812 lr: 7.10e-06 mem: 47% pow: 654.746 W 0: INFO 26-04-30 03:32:55.340931 - 11:57:36 - step: 45240 acc: 0 loss: 1.5076 grad: 1.65e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6296 data: 0.0855 lr: 7.08e-06 mem: 47% pow: 634.571 W 0: INFO 26-04-30 03:33:09.082637 - 11:57:49 - step: 45250 acc: 0 loss: 1.5466 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5953 data: 0.0878 lr: 7.07e-06 mem: 47% pow: 662.08 W 0: INFO 26-04-30 03:33:23.161596 - 11:58:03 - step: 45260 acc: 0 loss: 1.2038 grad: 1.60e-01 flops: 4.02e+14 wps: 4.66e+04 iter: 0.585 data: 0.0861 lr: 7.05e-06 mem: 47% pow: 664.477 W 0: INFO 26-04-30 03:33:36.892184 - 11:58:17 - step: 45270 acc: 0 loss: 1.1273 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6122 data: 0.0955 lr: 7.04e-06 mem: 47% pow: 644.854 W 0: INFO 26-04-30 03:33:50.756742 - 11:58:31 - step: 45280 acc: 0 loss: 0.9788 grad: 1.56e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5876 data: 0.0896 lr: 7.02e-06 mem: 47% pow: 658.406 W 0: INFO 26-04-30 03:34:05.277902 - 11:58:46 - step: 45290 acc: 0 loss: 1.4469 grad: 1.51e-01 flops: 3.89e+14 wps: 4.52e+04 iter: 0.5978 data: 0.0804 lr: 7.01e-06 mem: 47% pow: 654.801 W 0: INFO 26-04-30 03:34:19.293751 - 11:59:00 - step: 45300 acc: 0 loss: 1.2195 grad: 1.53e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5821 data: 0.0961 lr: 7.00e-06 mem: 47% pow: 659.599 W 0: INFO 26-04-30 03:34:35.846596 - 11:59:16 - step: 45310 acc: 0 loss: 1.3164 grad: 1.52e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.617 data: 0.095 lr: 6.98e-06 mem: 54% pow: 662.268 W 0: INFO 26-04-30 03:34:49.778627 - 11:59:30 - step: 45320 acc: 0 loss: 1.4654 grad: 1.51e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.6191 data: 0.0807 lr: 6.97e-06 mem: 47% pow: 653.225 W 0: INFO 26-04-30 03:35:03.574545 - 11:59:44 - step: 45330 acc: 0 loss: 1.4315 grad: 1.58e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.5922 data: 0.0807 lr: 6.95e-06 mem: 47% pow: 665.167 W 0: INFO 26-04-30 03:35:17.266258 - 11:59:58 - step: 45340 acc: 0 loss: 1.6864 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.581 data: 0.0861 lr: 6.94e-06 mem: 47% pow: 672.516 W 0: INFO 26-04-30 03:35:30.794674 - 12:00:11 - step: 45350 acc: 0 loss: 1.2302 grad: 3.25e-01 flops: 4.17e+14 wps: 4.85e+04 iter: 0.6298 data: 0.0659 lr: 6.92e-06 mem: 47% pow: 659.346 W 0: INFO 26-04-30 03:35:44.377160 - 12:00:25 - step: 45360 acc: 0 loss: 1.2676 grad: 1.71e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5788 data: 0.1144 lr: 6.91e-06 mem: 47% pow: 660.374 W 0: INFO 26-04-30 03:35:58.097074 - 12:00:38 - step: 45370 acc: 0 loss: 1.1957 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5799 data: 0.1015 lr: 6.89e-06 mem: 47% pow: 657.386 W 0: INFO 26-04-30 03:36:11.830045 - 12:00:52 - step: 45380 acc: 0 loss: 1.8561 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.7641 data: 0.0895 lr: 6.88e-06 mem: 47% pow: 569.346 W 0: INFO 26-04-30 03:36:25.743688 - 12:01:06 - step: 45390 acc: 0 loss: 1.0679 grad: 1.49e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.8049 data: 0.0836 lr: 6.86e-06 mem: 47% pow: 547.213 W 0: INFO 26-04-30 03:36:46.371881 - 12:01:27 - step: 45400 acc: 0 loss: 1.4643 grad: 1.54e-01 flops: 2.74e+14 wps: 3.18e+04 iter: 0.6042 data: 0.0848 lr: 6.85e-06 mem: 47% pow: 664.04 W 0: INFO 26-04-30 03:37:03.292654 - 12:01:44 - step: 45410 acc: 0 loss: 1.3086 grad: 1.46e-01 flops: 3.34e+14 wps: 3.87e+04 iter: 0.6502 data: 0.0881 lr: 6.83e-06 mem: 54% pow: 629.64 W 0: INFO 26-04-30 03:37:17.061586 - 12:01:57 - step: 45420 acc: 0 loss: 1.5342 grad: 1.51e-01 flops: 4.11e+14 wps: 4.76e+04 iter: 0.5817 data: 0.1316 lr: 6.82e-06 mem: 47% pow: 639.539 W 0: INFO 26-04-30 03:37:31.081413 - 12:02:11 - step: 45430 acc: 0 loss: 1.4028 grad: 1.44e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5927 data: 0.1352 lr: 6.80e-06 mem: 47% pow: 645.571 W 0: INFO 26-04-30 03:37:48.999097 - 12:02:29 - step: 45440 acc: 0 loss: 1.4521 grad: 1.48e-01 flops: 3.15e+14 wps: 3.66e+04 iter: 0.5881 data: 0.0862 lr: 6.79e-06 mem: 47% pow: 667.847 W 0: INFO 26-04-30 03:38:03.104582 - 12:02:43 - step: 45450 acc: 0 loss: 1.2679 grad: 1.50e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.5987 data: 0.0724 lr: 6.77e-06 mem: 47% pow: 685.129 W 0: INFO 26-04-30 03:38:17.073440 - 12:02:57 - step: 45460 acc: 0 loss: 1.1853 grad: 1.54e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5978 data: 0.0773 lr: 6.76e-06 mem: 47% pow: 661.146 W 0: INFO 26-04-30 03:38:30.657319 - 12:03:11 - step: 45470 acc: 0 loss: 1.1252 grad: 1.47e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5971 data: 0.0821 lr: 6.74e-06 mem: 47% pow: 657.712 W 0: INFO 26-04-30 03:38:44.644835 - 12:03:25 - step: 45480 acc: 0 loss: 1.2906 grad: 1.44e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.5846 data: 0.0966 lr: 6.73e-06 mem: 47% pow: 651.51 W 0: INFO 26-04-30 03:38:58.457510 - 12:03:39 - step: 45490 acc: 0 loss: 1.4987 grad: 1.52e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6622 data: 0.093 lr: 6.71e-06 mem: 47% pow: 622.612 W 0: INFO 26-04-30 03:39:12.245913 - 12:03:53 - step: 45500 acc: 0 loss: 1.0593 grad: 1.44e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.5994 data: 0.0876 lr: 6.70e-06 mem: 47% pow: 669.261 W 0: INFO 26-04-30 03:39:29.107937 - 12:04:09 - step: 45510 acc: 0 loss: 1.4626 grad: 1.61e-01 flops: 3.35e+14 wps: 3.89e+04 iter: 0.5874 data: 0.0829 lr: 6.68e-06 mem: 54% pow: 677.843 W 0: INFO 26-04-30 03:39:43.062054 - 12:04:23 - step: 45520 acc: 0 loss: 1.2221 grad: 1.48e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5997 data: 0.0829 lr: 6.67e-06 mem: 47% pow: 657.869 W 0: INFO 26-04-30 03:39:56.766225 - 12:04:37 - step: 45530 acc: 0 loss: 1.0216 grad: 2.10e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5989 data: 0.082 lr: 6.65e-06 mem: 47% pow: 660.605 W 0: INFO 26-04-30 03:40:10.467325 - 12:04:51 - step: 45540 acc: 0 loss: 1.2529 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6109 data: 0.0801 lr: 6.64e-06 mem: 47% pow: 647.448 W 0: INFO 26-04-30 03:40:24.137435 - 12:05:04 - step: 45550 acc: 0 loss: 1.2094 grad: 1.67e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6076 data: 0.0897 lr: 6.62e-06 mem: 47% pow: 649.344 W 0: INFO 26-04-30 03:40:38.046720 - 12:05:18 - step: 45560 acc: 0 loss: 1.5958 grad: 1.51e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5929 data: 0.0905 lr: 6.61e-06 mem: 47% pow: 661.678 W 0: INFO 26-04-30 03:40:52.307829 - 12:05:33 - step: 45570 acc: 0 loss: 1.3667 grad: 1.63e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.7423 data: 0.084 lr: 6.59e-06 mem: 47% pow: 589.762 W 0: INFO 26-04-30 03:41:06.041747 - 12:05:46 - step: 45580 acc: 0 loss: 1.3081 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5997 data: 0.0969 lr: 6.58e-06 mem: 47% pow: 653.982 W 0: INFO 26-04-30 03:41:19.669983 - 12:06:00 - step: 45590 acc: 0 loss: 1.388 grad: 1.51e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5905 data: 0.0837 lr: 6.56e-06 mem: 47% pow: 668.732 W 0: INFO 26-04-30 03:41:33.329812 - 12:06:14 - step: 45600 acc: 0 loss: 1.5801 grad: 1.44e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.654 data: 0.0769 lr: 6.55e-06 mem: 47% pow: 636.421 W 0: INFO 26-04-30 03:41:50.042622 - 12:06:30 - step: 45610 acc: 0 loss: 1.4583 grad: 1.48e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.6057 data: 0.0788 lr: 6.53e-06 mem: 54% pow: 666.626 W 0: INFO 26-04-30 03:42:03.632760 - 12:06:44 - step: 45620 acc: 0 loss: 1.7359 grad: 1.49e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5987 data: 0.0841 lr: 6.52e-06 mem: 47% pow: 663.077 W 0: INFO 26-04-30 03:42:17.434819 - 12:06:58 - step: 45630 acc: 0 loss: 1.5439 grad: 1.48e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6129 data: 0.0827 lr: 6.50e-06 mem: 47% pow: 647.046 W 0: INFO 26-04-30 03:42:31.046029 - 12:07:11 - step: 45640 acc: 0 loss: 2.0066 grad: 1.47e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5809 data: 0.0845 lr: 6.49e-06 mem: 47% pow: 674.983 W 0: INFO 26-04-30 03:42:44.971157 - 12:07:25 - step: 45650 acc: 0 loss: 1.2762 grad: 1.47e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6263 data: 0.0937 lr: 6.47e-06 mem: 47% pow: 659.431 W 0: INFO 26-04-30 03:42:58.924224 - 12:07:39 - step: 45660 acc: 0 loss: 1.4767 grad: 1.44e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6564 data: 0.0827 lr: 6.46e-06 mem: 47% pow: 627.921 W 0: INFO 26-04-30 03:43:12.688282 - 12:07:53 - step: 45670 acc: 0 loss: 1.3665 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6109 data: 0.0725 lr: 6.44e-06 mem: 47% pow: 658.956 W 0: INFO 26-04-30 03:43:26.526089 - 12:08:07 - step: 45680 acc: 0 loss: 1.4679 grad: 1.44e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5796 data: 0.1069 lr: 6.43e-06 mem: 47% pow: 658.745 W 0: INFO 26-04-30 03:43:43.866143 - 12:08:24 - step: 45690 acc: 0 loss: 1.4544 grad: 1.45e-01 flops: 3.26e+14 wps: 3.78e+04 iter: 0.6162 data: 0.0892 lr: 6.41e-06 mem: 47% pow: 648.677 W 0: INFO 26-04-30 03:43:57.722390 - 12:08:38 - step: 45700 acc: 0 loss: 1.4659 grad: 1.51e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6352 data: 0.0858 lr: 6.40e-06 mem: 47% pow: 645.287 W 0: INFO 26-04-30 03:44:17.225944 - 12:08:58 - step: 45710 acc: 0 loss: 1.678 grad: 1.45e-01 flops: 2.90e+14 wps: 3.36e+04 iter: 0.5904 data: 0.0884 lr: 6.39e-06 mem: 54% pow: 660.34 W 0: INFO 26-04-30 03:44:31.046329 - 12:09:11 - step: 45720 acc: 0 loss: 1.4275 grad: 1.58e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5811 data: 0.0873 lr: 6.37e-06 mem: 47% pow: 674.011 W 0: INFO 26-04-30 03:44:44.648612 - 12:09:25 - step: 45730 acc: 0 loss: 1.5954 grad: 1.50e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6011 data: 0.0888 lr: 6.36e-06 mem: 47% pow: 655.571 W 0: INFO 26-04-30 03:44:58.048556 - 12:09:38 - step: 45740 acc: 0 loss: 1.3444 grad: 1.45e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.58 data: 0.0909 lr: 6.34e-06 mem: 47% pow: 672.76 W 0: INFO 26-04-30 03:45:11.738738 - 12:09:52 - step: 45750 acc: 0 loss: 1.5438 grad: 1.41e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6666 data: 0.0808 lr: 6.33e-06 mem: 47% pow: 632.513 W 0: INFO 26-04-30 03:45:25.429918 - 12:10:06 - step: 45760 acc: 0 loss: 1.7824 grad: 1.45e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6216 data: 0.0882 lr: 6.31e-06 mem: 47% pow: 655.726 W 0: INFO 26-04-30 03:45:39.033875 - 12:10:19 - step: 45770 acc: 0 loss: 1.2726 grad: 1.42e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5867 data: 0.0891 lr: 6.30e-06 mem: 47% pow: 666.083 W 0: INFO 26-04-30 03:45:52.952277 - 12:10:33 - step: 45780 acc: 0 loss: 1.5336 grad: 1.47e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6309 data: 0.0967 lr: 6.28e-06 mem: 47% pow: 636.84 W 0: INFO 26-04-30 03:46:06.721722 - 12:10:47 - step: 45790 acc: 0 loss: 1.5468 grad: 1.52e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.7049 data: 0.0566 lr: 6.27e-06 mem: 47% pow: 612.239 W 0: INFO 26-04-30 03:46:20.627462 - 12:11:01 - step: 45800 acc: 0 loss: 1.2273 grad: 1.47e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6076 data: 0.0931 lr: 6.25e-06 mem: 47% pow: 646.365 W 0: INFO 26-04-30 03:46:37.456907 - 12:11:18 - step: 45810 acc: 0 loss: 1.2245 grad: 1.52e-01 flops: 3.36e+14 wps: 3.89e+04 iter: 0.5979 data: 0.0805 lr: 6.24e-06 mem: 54% pow: 665.755 W 0: INFO 26-04-30 03:46:51.187755 - 12:11:31 - step: 45820 acc: 0 loss: 1.1346 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5952 data: 0.0939 lr: 6.22e-06 mem: 47% pow: 655.273 W 0: INFO 26-04-30 03:47:05.044810 - 12:11:45 - step: 45830 acc: 0 loss: 1.5714 grad: 1.47e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5821 data: 0.1446 lr: 6.21e-06 mem: 47% pow: 640.238 W 0: INFO 26-04-30 03:47:25.722200 - 12:12:06 - step: 45840 acc: 0 loss: 1.8228 grad: 1.49e-01 flops: 2.73e+14 wps: 3.17e+04 iter: 0.6008 data: 0.0949 lr: 6.19e-06 mem: 47% pow: 659.626 W 0: INFO 26-04-30 03:47:39.122999 - 12:12:19 - step: 45850 acc: 0 loss: 1.5503 grad: 1.45e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.6429 data: 0.1 lr: 6.18e-06 mem: 47% pow: 626.688 W 0: INFO 26-04-30 03:47:52.812111 - 12:12:33 - step: 45860 acc: 0 loss: 1.6374 grad: 1.42e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6038 data: 0.0813 lr: 6.16e-06 mem: 47% pow: 664.734 W 0: INFO 26-04-30 03:48:07.217715 - 12:12:48 - step: 45870 acc: 0 loss: 1.4561 grad: 1.51e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6096 data: 0.0837 lr: 6.15e-06 mem: 47% pow: 656.96 W 0: INFO 26-04-30 03:48:20.635095 - 12:13:01 - step: 45880 acc: 0 loss: 1.4341 grad: 1.45e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5965 data: 0.0861 lr: 6.13e-06 mem: 47% pow: 656.082 W 0: INFO 26-04-30 03:48:34.273238 - 12:13:15 - step: 45890 acc: 0 loss: 1.2453 grad: 1.47e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6263 data: 0.0623 lr: 6.12e-06 mem: 47% pow: 654.789 W 0: INFO 26-04-30 03:48:48.073576 - 12:13:28 - step: 45900 acc: 0 loss: 1.353 grad: 1.46e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6312 data: 0.0827 lr: 6.10e-06 mem: 47% pow: 640.54 W 0: INFO 26-04-30 03:49:04.578015 - 12:13:45 - step: 45910 acc: 0 loss: 1.5528 grad: 1.51e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.5826 data: 0.0919 lr: 6.09e-06 mem: 54% pow: 664.017 W 0: INFO 26-04-30 03:49:18.230116 - 12:13:59 - step: 45920 acc: 0 loss: 1.5827 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5918 data: 0.0929 lr: 6.07e-06 mem: 47% pow: 670.907 W 0: INFO 26-04-30 03:49:31.850495 - 12:14:12 - step: 45930 acc: 0 loss: 1.1075 grad: 1.41e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5972 data: 0.0849 lr: 6.06e-06 mem: 47% pow: 657.139 W 0: INFO 26-04-30 03:49:45.369571 - 12:14:26 - step: 45940 acc: 0 loss: 2.1064 grad: 1.56e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6048 data: 0.0834 lr: 6.04e-06 mem: 47% pow: 656.393 W 0: INFO 26-04-30 03:49:59.750887 - 12:14:40 - step: 45950 acc: 0 loss: 1.49 grad: 1.71e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6207 data: 0.0874 lr: 6.03e-06 mem: 47% pow: 639.387 W 0: INFO 26-04-30 03:50:13.798710 - 12:14:54 - step: 45960 acc: 0 loss: 2.4854 grad: 1.40e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6054 data: 0.0684 lr: 6.01e-06 mem: 47% pow: 670.997 W 0: INFO 26-04-30 03:50:27.756237 - 12:15:08 - step: 45970 acc: 0 loss: 1.252 grad: 1.42e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.5915 data: 0.0895 lr: 6.00e-06 mem: 47% pow: 655.473 W 0: INFO 26-04-30 03:50:41.548322 - 12:15:22 - step: 45980 acc: 0 loss: 1.3553 grad: 1.39e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6089 data: 0.1392 lr: 5.98e-06 mem: 47% pow: 622.55 W 0: INFO 26-04-30 03:50:55.226612 - 12:15:36 - step: 45990 acc: 0 loss: 1.3716 grad: 1.95e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5932 data: 0.0935 lr: 5.97e-06 mem: 47% pow: 662.657 W 0: INFO 26-04-30 03:51:09.054440 - 12:15:49 - step: 46000 acc: 0 loss: 1.6636 grad: 1.47e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6024 data: 0.086 lr: 5.95e-06 mem: 47% pow: 664.876 W 0: INFO 26-04-30 03:51:12.749728 - 12:15:53 - garbage collection 0: INFO 26-04-30 03:51:27.261823 - 12:16:08 - step: 46010 acc: 0 loss: 1.5236 grad: 1.44e-01 flops: 3.10e+14 wps: 3.60e+04 iter: 0.5914 data: 0.0926 lr: 5.94e-06 mem: 54% pow: 678.539 W 0: INFO 26-04-30 03:51:41.025946 - 12:16:21 - step: 46020 acc: 0 loss: 1.2747 grad: 1.45e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.597 data: 0.0957 lr: 5.92e-06 mem: 47% pow: 653.001 W 0: INFO 26-04-30 03:51:57.245006 - 12:16:38 - step: 46030 acc: 0 loss: 1.859 grad: 1.45e-01 flops: 3.48e+14 wps: 4.04e+04 iter: 0.6284 data: 0.0896 lr: 5.91e-06 mem: 47% pow: 641.928 W 0: INFO 26-04-30 03:52:11.043717 - 12:16:51 - step: 46040 acc: 0 loss: 1.5752 grad: 1.41e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.7061 data: 0.0873 lr: 5.89e-06 mem: 47% pow: 600.155 W 0: INFO 26-04-30 03:52:25.038804 - 12:17:05 - step: 46050 acc: 0 loss: 1.57 grad: 1.43e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.936 data: 0.0788 lr: 5.88e-06 mem: 47% pow: 474.249 W 0: INFO 26-04-30 03:52:38.651190 - 12:17:19 - step: 46060 acc: 0 loss: 1.3496 grad: 1.46e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5959 data: 0.0888 lr: 5.86e-06 mem: 47% pow: 664.024 W 0: INFO 26-04-30 03:52:52.362820 - 12:17:33 - step: 46070 acc: 0 loss: 1.3588 grad: 1.42e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6061 data: 0.0848 lr: 5.85e-06 mem: 47% pow: 671.877 W 0: INFO 26-04-30 03:53:06.275340 - 12:17:47 - step: 46080 acc: 0 loss: 1.4244 grad: 1.44e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6023 data: 0.0886 lr: 5.83e-06 mem: 47% pow: 656.971 W 0: INFO 26-04-30 03:53:20.243359 - 12:18:01 - step: 46090 acc: 0 loss: 1.5973 grad: 1.43e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6079 data: 0.092 lr: 5.82e-06 mem: 47% pow: 654.786 W 0: INFO 26-04-30 03:53:33.968369 - 12:18:14 - step: 46100 acc: 0 loss: 1.41 grad: 1.38e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5915 data: 0.0909 lr: 5.80e-06 mem: 47% pow: 661.859 W 0: INFO 26-04-30 03:53:50.793969 - 12:18:31 - step: 46110 acc: 0 loss: 1.3478 grad: 1.39e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.5973 data: 0.0882 lr: 5.79e-06 mem: 54% pow: 658.772 W 0: INFO 26-04-30 03:54:04.398211 - 12:18:45 - step: 46120 acc: 0 loss: 1.6587 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5914 data: 0.0851 lr: 5.77e-06 mem: 47% pow: 662.81 W 0: INFO 26-04-30 03:54:18.130995 - 12:18:58 - step: 46130 acc: 0 loss: 1.1833 grad: 1.41e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5794 data: 0.11 lr: 5.76e-06 mem: 47% pow: 657.019 W 0: INFO 26-04-30 03:54:31.809278 - 12:19:12 - step: 46140 acc: 0 loss: 1.7052 grad: 1.41e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6399 data: 0.0879 lr: 5.75e-06 mem: 47% pow: 632.404 W 0: INFO 26-04-30 03:54:45.440844 - 12:19:26 - step: 46150 acc: 0 loss: 1.7472 grad: 1.42e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6358 data: 0.0944 lr: 5.73e-06 mem: 47% pow: 636.385 W 0: INFO 26-04-30 03:54:59.246223 - 12:19:40 - step: 46160 acc: 0 loss: 1.5763 grad: 1.41e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6085 data: 0.0707 lr: 5.72e-06 mem: 47% pow: 665.205 W 0: INFO 26-04-30 03:55:13.057908 - 12:19:53 - step: 46170 acc: 0 loss: 1.4598 grad: 1.41e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5783 data: 0.0978 lr: 5.70e-06 mem: 47% pow: 666.298 W 0: INFO 26-04-30 03:55:26.553975 - 12:20:07 - step: 46180 acc: 0 loss: 1.4489 grad: 1.40e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6014 data: 0.0903 lr: 5.69e-06 mem: 47% pow: 651.683 W 0: INFO 26-04-30 03:55:40.183883 - 12:20:20 - step: 46190 acc: 0 loss: 1.9127 grad: 1.37e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6271 data: 0.0736 lr: 5.67e-06 mem: 47% pow: 654.765 W 0: INFO 26-04-30 03:55:53.893047 - 12:20:34 - step: 46200 acc: 0 loss: 1.3711 grad: 1.39e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5945 data: 0.0934 lr: 5.66e-06 mem: 47% pow: 658.889 W 0: INFO 26-04-30 03:56:10.640301 - 12:20:51 - step: 46210 acc: 0 loss: 1.277 grad: 1.57e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.6794 data: 0.0953 lr: 5.64e-06 mem: 54% pow: 606.178 W 0: INFO 26-04-30 03:56:24.497975 - 12:21:05 - step: 46220 acc: 0 loss: 1.7986 grad: 1.41e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6042 data: 0.0853 lr: 5.63e-06 mem: 47% pow: 662.462 W 0: INFO 26-04-30 03:56:38.253516 - 12:21:19 - step: 46230 acc: 0 loss: 1.5506 grad: 1.37e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.582 data: 0.107 lr: 5.61e-06 mem: 47% pow: 658.652 W 0: INFO 26-04-30 03:56:52.031681 - 12:21:32 - step: 46240 acc: 0 loss: 1.2399 grad: 1.40e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6479 data: 0.0932 lr: 5.60e-06 mem: 47% pow: 637.079 W 0: INFO 26-04-30 03:57:05.997674 - 12:21:46 - step: 46250 acc: 0 loss: 1.5647 grad: 1.45e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6082 data: 0.0999 lr: 5.58e-06 mem: 47% pow: 643.359 W 0: INFO 26-04-30 03:57:19.791445 - 12:22:00 - step: 46260 acc: 0 loss: 1.5437 grad: 1.46e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6279 data: 0.0723 lr: 5.57e-06 mem: 47% pow: 648.4 W 0: INFO 26-04-30 03:57:33.430682 - 12:22:14 - step: 46270 acc: 0 loss: 1.5578 grad: 1.40e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5878 data: 0.0996 lr: 5.55e-06 mem: 47% pow: 662.704 W 0: INFO 26-04-30 03:57:47.022166 - 12:22:27 - step: 46280 acc: 0 loss: 1.4262 grad: 1.39e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.6027 data: 0.0945 lr: 5.54e-06 mem: 47% pow: 651.493 W 0: INFO 26-04-30 03:58:00.899734 - 12:22:41 - step: 46290 acc: 0 loss: 1.7824 grad: 1.40e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.5798 data: 0.1144 lr: 5.52e-06 mem: 47% pow: 649.584 W 0: INFO 26-04-30 03:58:14.790375 - 12:22:55 - step: 46300 acc: 0 loss: 1.6101 grad: 1.41e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5945 data: 0.0931 lr: 5.51e-06 mem: 47% pow: 663.882 W 0: INFO 26-04-30 03:58:31.691789 - 12:23:12 - step: 46310 acc: 0 loss: 1.5833 grad: 1.39e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6186 data: 0.1026 lr: 5.49e-06 mem: 54% pow: 627.022 W 0: INFO 26-04-30 03:58:45.328174 - 12:23:26 - step: 46320 acc: 0 loss: 1.3742 grad: 1.41e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6159 data: 0.0897 lr: 5.48e-06 mem: 47% pow: 653.402 W 0: INFO 26-04-30 03:58:59.154876 - 12:23:39 - step: 46330 acc: 0 loss: 1.4638 grad: 1.42e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.595 data: 0.0877 lr: 5.46e-06 mem: 47% pow: 662.106 W 0: INFO 26-04-30 03:59:13.320223 - 12:23:54 - step: 46340 acc: 0 loss: 1.547 grad: 1.40e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5897 data: 0.0851 lr: 5.45e-06 mem: 47% pow: 661.407 W 0: INFO 26-04-30 03:59:26.962532 - 12:24:07 - step: 46350 acc: 0 loss: 1.1861 grad: 1.39e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6454 data: 0.0941 lr: 5.43e-06 mem: 47% pow: 625.687 W 0: INFO 26-04-30 03:59:40.447273 - 12:24:21 - step: 46360 acc: 0 loss: 1.504 grad: 1.36e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6023 data: 0.0811 lr: 5.42e-06 mem: 47% pow: 662.149 W 0: INFO 26-04-30 03:59:53.986461 - 12:24:34 - step: 46370 acc: 0 loss: 1.3346 grad: 1.39e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6128 data: 0.0879 lr: 5.40e-06 mem: 47% pow: 649.023 W 0: INFO 26-04-30 04:00:07.617596 - 12:24:48 - step: 46380 acc: 0 loss: 1.7306 grad: 1.42e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5997 data: 0.0855 lr: 5.39e-06 mem: 47% pow: 670.371 W 0: INFO 26-04-30 04:00:21.072824 - 12:25:01 - step: 46390 acc: 0 loss: 1.6909 grad: 1.43e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5976 data: 0.0913 lr: 5.37e-06 mem: 47% pow: 662.198 W 0: INFO 26-04-30 04:00:34.647634 - 12:25:15 - step: 46400 acc: 0 loss: 1.487 grad: 1.41e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5996 data: 0.0732 lr: 5.36e-06 mem: 47% pow: 674.486 W 0: INFO 26-04-30 04:00:51.233699 - 12:25:32 - step: 46410 acc: 0 loss: 1.7246 grad: 1.43e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.578 data: 0.0928 lr: 5.34e-06 mem: 54% pow: 676.741 W 0: INFO 26-04-30 04:01:05.055379 - 12:25:45 - step: 46420 acc: 0 loss: 1.5759 grad: 1.42e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6069 data: 0.0816 lr: 5.33e-06 mem: 47% pow: 656.33 W 0: INFO 26-04-30 04:01:18.705580 - 12:25:59 - step: 46430 acc: 0 loss: 1.4969 grad: 1.37e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5963 data: 0.0847 lr: 5.31e-06 mem: 47% pow: 661.858 W 0: INFO 26-04-30 04:01:32.234156 - 12:26:13 - step: 46440 acc: 0 loss: 1.5589 grad: 1.41e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.593 data: 0.0889 lr: 5.30e-06 mem: 47% pow: 661.105 W 0: INFO 26-04-30 04:01:45.949930 - 12:26:26 - step: 46450 acc: 0 loss: 1.4005 grad: 1.43e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5949 data: 0.0871 lr: 5.28e-06 mem: 47% pow: 661.432 W 0: INFO 26-04-30 04:02:01.865610 - 12:26:42 - step: 46460 acc: 0 loss: 1.2447 grad: 1.44e-01 flops: 3.55e+14 wps: 4.12e+04 iter: 0.6103 data: 0.0849 lr: 5.27e-06 mem: 47% pow: 658.411 W 0: INFO 26-04-30 04:02:15.434105 - 12:26:56 - step: 46470 acc: 0 loss: 1.4557 grad: 1.37e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5882 data: 0.0941 lr: 5.25e-06 mem: 47% pow: 656.56 W 0: INFO 26-04-30 04:02:28.996568 - 12:27:09 - step: 46480 acc: 0 loss: 1.4288 grad: 1.39e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6123 data: 0.0993 lr: 5.24e-06 mem: 47% pow: 636.672 W 0: INFO 26-04-30 04:02:42.543540 - 12:27:23 - step: 46490 acc: 0 loss: 1.5674 grad: 1.39e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5951 data: 0.0973 lr: 5.22e-06 mem: 47% pow: 653.607 W 0: INFO 26-04-30 04:02:56.173224 - 12:27:36 - step: 46500 acc: 0 loss: 1.5731 grad: 1.41e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5793 data: 0.1101 lr: 5.21e-06 mem: 47% pow: 663.613 W 0: INFO 26-04-30 04:03:12.723747 - 12:27:53 - step: 46510 acc: 0 loss: 1.7657 grad: 1.41e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.7151 data: 0.0934 lr: 5.19e-06 mem: 54% pow: 594.233 W 0: INFO 26-04-30 04:03:26.468512 - 12:28:07 - step: 46520 acc: 0 loss: 1.9058 grad: 1.41e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5898 data: 0.0898 lr: 5.18e-06 mem: 47% pow: 662.731 W 0: INFO 26-04-30 04:03:39.919333 - 12:28:20 - step: 46530 acc: 0 loss: 1.3201 grad: 1.40e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5992 data: 0.0884 lr: 5.16e-06 mem: 47% pow: 661.038 W 0: INFO 26-04-30 04:03:53.439016 - 12:28:34 - step: 46540 acc: 0 loss: 1.5826 grad: 1.38e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6042 data: 0.0885 lr: 5.15e-06 mem: 47% pow: 652.486 W 0: INFO 26-04-30 04:04:06.824332 - 12:28:47 - step: 46550 acc: 0 loss: 1.7849 grad: 1.40e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5884 data: 0.0871 lr: 5.14e-06 mem: 47% pow: 663.271 W 0: INFO 26-04-30 04:04:20.454223 - 12:29:01 - step: 46560 acc: 0 loss: 1.1712 grad: 1.45e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6104 data: 0.0836 lr: 5.12e-06 mem: 47% pow: 643.778 W 0: INFO 26-04-30 04:04:34.086256 - 12:29:14 - step: 46570 acc: 0 loss: 1.5708 grad: 1.38e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6015 data: 0.079 lr: 5.11e-06 mem: 47% pow: 660.691 W 0: INFO 26-04-30 04:04:47.567116 - 12:29:28 - step: 46580 acc: 0 loss: 1.6498 grad: 1.40e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5921 data: 0.0875 lr: 5.09e-06 mem: 47% pow: 658.234 W 0: INFO 26-04-30 04:05:01.239655 - 12:29:42 - step: 46590 acc: 0 loss: 1.3956 grad: 1.36e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6231 data: 0.0869 lr: 5.08e-06 mem: 47% pow: 659.906 W 0: INFO 26-04-30 04:05:15.006884 - 12:29:55 - step: 46600 acc: 0 loss: 1.5005 grad: 1.79e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6073 data: 0.0872 lr: 5.06e-06 mem: 47% pow: 648.52 W 0: INFO 26-04-30 04:05:31.633927 - 12:30:12 - step: 46610 acc: 0 loss: 1.5063 grad: 1.53e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.5799 data: 0.0893 lr: 5.05e-06 mem: 54% pow: 668.342 W 0: INFO 26-04-30 04:05:45.123189 - 12:30:25 - step: 46620 acc: 0 loss: 1.2888 grad: 1.48e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6298 data: 0.0789 lr: 5.03e-06 mem: 47% pow: 654.316 W 0: INFO 26-04-30 04:05:58.600008 - 12:30:39 - step: 46630 acc: 0 loss: 1.5692 grad: 1.44e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.588 data: 0.0988 lr: 5.02e-06 mem: 47% pow: 662.795 W 0: INFO 26-04-30 04:06:12.027322 - 12:30:52 - step: 46640 acc: 0 loss: 1.4305 grad: 1.43e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5972 data: 0.0786 lr: 5.00e-06 mem: 47% pow: 664.158 W 0: INFO 26-04-30 04:06:26.157934 - 12:31:06 - step: 46650 acc: 0 loss: 1.4379 grad: 1.42e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6371 data: 0.0845 lr: 4.99e-06 mem: 47% pow: 637.782 W 0: INFO 26-04-30 04:06:39.912955 - 12:31:20 - step: 46660 acc: 0 loss: 1.1234 grad: 1.42e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6379 data: 0.0891 lr: 4.97e-06 mem: 47% pow: 637.978 W 0: INFO 26-04-30 04:06:53.504144 - 12:31:34 - step: 46670 acc: 0 loss: 1.6118 grad: 1.44e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.7082 data: 0.0893 lr: 4.96e-06 mem: 47% pow: 593.531 W 0: INFO 26-04-30 04:07:07.029642 - 12:31:47 - step: 46680 acc: 0 loss: 1.731 grad: 1.45e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5828 data: 0.1406 lr: 4.94e-06 mem: 47% pow: 628.008 W 0: INFO 26-04-30 04:07:20.498926 - 12:32:01 - step: 46690 acc: 0 loss: 1.6176 grad: 1.45e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5855 data: 0.0851 lr: 4.93e-06 mem: 47% pow: 668.734 W 0: INFO 26-04-30 04:07:34.070261 - 12:32:14 - step: 46700 acc: 0 loss: 1.6126 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6125 data: 0.0813 lr: 4.91e-06 mem: 47% pow: 667.108 W 0: INFO 26-04-30 04:07:50.602657 - 12:32:31 - step: 46710 acc: 0 loss: 1.4468 grad: 1.45e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.6105 data: 0.09 lr: 4.90e-06 mem: 54% pow: 661.286 W 0: INFO 26-04-30 04:08:04.177379 - 12:32:44 - step: 46720 acc: 0 loss: 1.5897 grad: 1.50e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6025 data: 0.0826 lr: 4.88e-06 mem: 47% pow: 662.196 W 0: INFO 26-04-30 04:08:17.746088 - 12:32:58 - step: 46730 acc: 0 loss: 1.3136 grad: 1.40e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6367 data: 0.0743 lr: 4.87e-06 mem: 47% pow: 654.367 W 0: INFO 26-04-30 04:08:31.505558 - 12:33:12 - step: 46740 acc: 0 loss: 1.4048 grad: 1.45e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5893 data: 0.0825 lr: 4.85e-06 mem: 47% pow: 662.975 W 0: INFO 26-04-30 04:08:44.973293 - 12:33:25 - step: 46750 acc: 0 loss: 1.7927 grad: 1.40e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5915 data: 0.0961 lr: 4.84e-06 mem: 47% pow: 669.279 W 0: INFO 26-04-30 04:08:59.985367 - 12:33:40 - step: 46760 acc: 0 loss: 1.6145 grad: 1.45e-01 flops: 3.77e+14 wps: 4.37e+04 iter: 0.5864 data: 0.1001 lr: 4.82e-06 mem: 47% pow: 662.727 W 0: INFO 26-04-30 04:09:13.577736 - 12:33:54 - step: 46770 acc: 0 loss: 1.7443 grad: 1.40e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5954 data: 0.0935 lr: 4.81e-06 mem: 47% pow: 668.751 W 0: INFO 26-04-30 04:09:27.275091 - 12:34:08 - step: 46780 acc: 0 loss: 1.3839 grad: 1.46e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5903 data: 0.0937 lr: 4.79e-06 mem: 47% pow: 664.312 W 0: INFO 26-04-30 04:09:40.666499 - 12:34:21 - step: 46790 acc: 0 loss: 1.4888 grad: 1.43e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.5977 data: 0.0824 lr: 4.78e-06 mem: 47% pow: 665.145 W 0: INFO 26-04-30 04:09:54.135644 - 12:34:34 - step: 46800 acc: 0 loss: 1.1627 grad: 1.43e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.5957 data: 0.0885 lr: 4.76e-06 mem: 47% pow: 662.324 W 0: INFO 26-04-30 04:10:10.725497 - 12:34:51 - step: 46810 acc: 0 loss: 1.6756 grad: 1.45e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6064 data: 0.0927 lr: 4.75e-06 mem: 54% pow: 640.553 W 0: INFO 26-04-30 04:10:24.091544 - 12:35:04 - step: 46820 acc: 0 loss: 1.3354 grad: 1.44e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.5958 data: 0.086 lr: 4.73e-06 mem: 47% pow: 658.554 W 0: INFO 26-04-30 04:10:37.698791 - 12:35:18 - step: 46830 acc: 0 loss: 1.4714 grad: 1.39e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5901 data: 0.0929 lr: 4.72e-06 mem: 47% pow: 657.397 W 0: INFO 26-04-30 04:10:51.287996 - 12:35:32 - step: 46840 acc: 0 loss: 1.5685 grad: 1.42e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5904 data: 0.0909 lr: 4.70e-06 mem: 47% pow: 657.708 W 0: INFO 26-04-30 04:11:04.770295 - 12:35:45 - step: 46850 acc: 0 loss: 1.8586 grad: 1.45e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6404 data: 0.0839 lr: 4.69e-06 mem: 47% pow: 638.084 W 0: INFO 26-04-30 04:11:18.180595 - 12:35:58 - step: 46860 acc: 0 loss: 1.4191 grad: 1.44e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.5921 data: 0.0887 lr: 4.67e-06 mem: 47% pow: 656.706 W 0: INFO 26-04-30 04:11:31.862577 - 12:36:12 - step: 46870 acc: 0 loss: 1.4145 grad: 1.49e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6004 data: 0.0869 lr: 4.66e-06 mem: 47% pow: 656.989 W 0: INFO 26-04-30 04:11:45.535800 - 12:36:26 - step: 46880 acc: 0 loss: 1.4521 grad: 1.39e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5915 data: 0.0922 lr: 4.64e-06 mem: 47% pow: 662.161 W 0: INFO 26-04-30 04:11:59.078784 - 12:36:39 - step: 46890 acc: 0 loss: 1.6321 grad: 1.44e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5982 data: 0.0912 lr: 4.63e-06 mem: 47% pow: 652.154 W 0: INFO 26-04-30 04:12:12.637659 - 12:36:53 - step: 46900 acc: 0 loss: 1.4438 grad: 1.43e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5957 data: 0.0908 lr: 4.61e-06 mem: 47% pow: 669.132 W 0: INFO 26-04-30 04:12:29.213486 - 12:37:10 - step: 46910 acc: 0 loss: 1.435 grad: 1.42e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6292 data: 0.0906 lr: 4.60e-06 mem: 54% pow: 635.237 W 0: INFO 26-04-30 04:12:42.955480 - 12:37:23 - step: 46920 acc: 0 loss: 1.4672 grad: 1.38e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6323 data: 0.0904 lr: 4.58e-06 mem: 47% pow: 639.394 W 0: INFO 26-04-30 04:12:56.734057 - 12:37:37 - step: 46930 acc: 0 loss: 1.6362 grad: 1.44e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5986 data: 0.0881 lr: 4.57e-06 mem: 47% pow: 658.376 W 0: INFO 26-04-30 04:13:11.494264 - 12:37:52 - step: 46940 acc: 0 loss: 1.2509 grad: 1.43e-01 flops: 3.83e+14 wps: 4.44e+04 iter: 0.5979 data: 0.0885 lr: 4.55e-06 mem: 47% pow: 665.274 W 0: INFO 26-04-30 04:13:25.073887 - 12:38:05 - step: 46950 acc: 0 loss: 1.3576 grad: 1.44e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6057 data: 0.0929 lr: 4.54e-06 mem: 47% pow: 654.449 W 0: INFO 26-04-30 04:13:38.558355 - 12:38:19 - step: 46960 acc: 0 loss: 1.3794 grad: 1.46e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.6022 data: 0.0829 lr: 4.53e-06 mem: 47% pow: 665.492 W 0: INFO 26-04-30 04:13:52.506384 - 12:38:33 - step: 46970 acc: 0 loss: 1.7498 grad: 1.40e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6726 data: 0.0032 lr: 4.51e-06 mem: 47% pow: 662.534 W 0: INFO 26-04-30 04:14:06.058007 - 12:38:46 - step: 46980 acc: 0 loss: 1.4009 grad: 1.41e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6535 data: 0.0524 lr: 4.50e-06 mem: 47% pow: 655.404 W 0: INFO 26-04-30 04:14:19.569936 - 12:39:00 - step: 46990 acc: 0 loss: 1.7023 grad: 1.43e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5879 data: 0.0935 lr: 4.48e-06 mem: 47% pow: 667.413 W 0: INFO 26-04-30 04:14:33.153612 - 12:39:13 - step: 47000 acc: 0 loss: 1.6301 grad: 1.42e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5883 data: 0.0907 lr: 4.47e-06 mem: 47% pow: 663.173 W 0: INFO 26-04-30 04:14:36.833966 - 12:39:17 - garbage collection 0: INFO 26-04-30 04:14:51.409530 - 12:39:32 - step: 47010 acc: 0 loss: 1.7106 grad: 1.40e-01 flops: 3.09e+14 wps: 3.59e+04 iter: 0.5873 data: 0.0918 lr: 4.45e-06 mem: 54% pow: 660.554 W 0: INFO 26-04-30 04:15:05.786824 - 12:39:46 - step: 47020 acc: 0 loss: 1.1409 grad: 1.43e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.5942 data: 0.0963 lr: 4.44e-06 mem: 47% pow: 657.342 W 0: INFO 26-04-30 04:15:19.338811 - 12:40:00 - step: 47030 acc: 0 loss: 1.6659 grad: 1.46e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6246 data: 0.0643 lr: 4.42e-06 mem: 47% pow: 667.026 W 0: INFO 26-04-30 04:15:32.797664 - 12:40:13 - step: 47040 acc: 0 loss: 1.4323 grad: 1.45e-01 flops: 4.20e+14 wps: 4.87e+04 iter: 0.5967 data: 0.0749 lr: 4.41e-06 mem: 47% pow: 679.234 W 0: INFO 26-04-30 04:15:47.196932 - 12:40:27 - step: 47050 acc: 0 loss: 1.4988 grad: 1.41e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.5923 data: 0.0856 lr: 4.39e-06 mem: 47% pow: 671.684 W 0: INFO 26-04-30 04:16:03.706401 - 12:40:44 - step: 47060 acc: 0 loss: 1.3731 grad: 1.42e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.577 data: 0.0934 lr: 4.38e-06 mem: 47% pow: 671.667 W 0: INFO 26-04-30 04:16:17.110623 - 12:40:57 - step: 47070 acc: 0 loss: 1.4105 grad: 1.40e-01 flops: 4.21e+14 wps: 4.89e+04 iter: 0.5961 data: 0.0839 lr: 4.36e-06 mem: 47% pow: 667.103 W 0: INFO 26-04-30 04:16:30.715402 - 12:41:11 - step: 47080 acc: 0 loss: 1.6126 grad: 1.41e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.592 data: 0.094 lr: 4.35e-06 mem: 47% pow: 658.378 W 0: INFO 26-04-30 04:16:44.282245 - 12:41:25 - step: 47090 acc: 0 loss: 1.183 grad: 1.42e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5793 data: 0.0995 lr: 4.33e-06 mem: 47% pow: 659.68 W 0: INFO 26-04-30 04:16:57.929587 - 12:41:38 - step: 47100 acc: 0 loss: 1.5625 grad: 1.43e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5898 data: 0.0823 lr: 4.32e-06 mem: 47% pow: 665.187 W 0: INFO 26-04-30 04:17:14.752748 - 12:41:55 - step: 47110 acc: 0 loss: 1.8311 grad: 1.47e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.5999 data: 0.0832 lr: 4.30e-06 mem: 54% pow: 660.532 W 0: INFO 26-04-30 04:17:28.794471 - 12:42:09 - step: 47120 acc: 0 loss: 1.375 grad: 1.46e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.8573 data: 0.0797 lr: 4.29e-06 mem: 47% pow: 519.53 W 0: INFO 26-04-30 04:17:42.159965 - 12:42:22 - step: 47130 acc: 0 loss: 1.2959 grad: 1.48e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.5959 data: 0.0896 lr: 4.27e-06 mem: 47% pow: 653.286 W 0: INFO 26-04-30 04:17:55.677786 - 12:42:36 - step: 47140 acc: 0 loss: 1.8688 grad: 1.46e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5804 data: 0.137 lr: 4.26e-06 mem: 47% pow: 643.226 W 0: INFO 26-04-30 04:18:10.497750 - 12:42:51 - step: 47150 acc: 0 loss: 1.9705 grad: 1.48e-01 flops: 3.81e+14 wps: 4.42e+04 iter: 0.6386 data: 0.0876 lr: 4.24e-06 mem: 47% pow: 638.395 W 0: INFO 26-04-30 04:18:24.119773 - 12:43:04 - step: 47160 acc: 0 loss: 1.7289 grad: 1.46e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5948 data: 0.0826 lr: 4.23e-06 mem: 47% pow: 690.841 W 0: INFO 26-04-30 04:18:37.709810 - 12:43:18 - step: 47170 acc: 0 loss: 1.7874 grad: 1.48e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5795 data: 0.1161 lr: 4.21e-06 mem: 47% pow: 655.944 W 0: INFO 26-04-30 04:18:51.608675 - 12:43:32 - step: 47180 acc: 0 loss: 1.6186 grad: 1.46e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6089 data: 0.0615 lr: 4.20e-06 mem: 47% pow: 674.002 W 0: INFO 26-04-30 04:19:05.703718 - 12:43:46 - step: 47190 acc: 0 loss: 1.5044 grad: 1.47e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5779 data: 0.1307 lr: 4.18e-06 mem: 47% pow: 640.075 W 0: INFO 26-04-30 04:19:19.527308 - 12:44:00 - step: 47200 acc: 0 loss: 1.4761 grad: 1.45e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6083 data: 0.082 lr: 4.17e-06 mem: 47% pow: 666.457 W 0: INFO 26-04-30 04:19:36.024189 - 12:44:16 - step: 47210 acc: 0 loss: 1.6826 grad: 1.46e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.5795 data: 0.1129 lr: 4.15e-06 mem: 54% pow: 652.643 W 0: INFO 26-04-30 04:19:49.543139 - 12:44:30 - step: 47220 acc: 0 loss: 1.7423 grad: 1.45e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6134 data: 0.0925 lr: 4.14e-06 mem: 47% pow: 666.312 W 0: INFO 26-04-30 04:20:03.422166 - 12:44:44 - step: 47230 acc: 0 loss: 1.8564 grad: 1.51e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.6223 data: 0.0651 lr: 4.12e-06 mem: 47% pow: 659.756 W 0: INFO 26-04-30 04:20:17.661665 - 12:44:58 - step: 47240 acc: 0 loss: 1.5019 grad: 1.47e-01 flops: 3.97e+14 wps: 4.61e+04 iter: 0.6015 data: 0.0803 lr: 4.11e-06 mem: 47% pow: 658.822 W 0: INFO 26-04-30 04:20:31.310071 - 12:45:12 - step: 47250 acc: 0 loss: 1.4449 grad: 1.47e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6625 data: 0.0951 lr: 4.09e-06 mem: 47% pow: 616.034 W 0: INFO 26-04-30 04:20:45.349258 - 12:45:26 - step: 47260 acc: 0 loss: 1.4283 grad: 1.46e-01 flops: 4.03e+14 wps: 4.67e+04 iter: 0.6818 data: 0.0818 lr: 4.08e-06 mem: 47% pow: 623.627 W 0: INFO 26-04-30 04:20:59.138778 - 12:45:39 - step: 47270 acc: 0 loss: 1.5485 grad: 1.47e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.5852 data: 0.1002 lr: 4.06e-06 mem: 47% pow: 663.915 W 0: INFO 26-04-30 04:21:12.718823 - 12:45:53 - step: 47280 acc: 0 loss: 1.6692 grad: 1.45e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6194 data: 0.0836 lr: 4.05e-06 mem: 47% pow: 646.638 W 0: INFO 26-04-30 04:21:28.033866 - 12:46:08 - step: 47290 acc: 0 loss: 1.6477 grad: 1.48e-01 flops: 3.69e+14 wps: 4.28e+04 iter: 0.7318 data: 0.087 lr: 4.03e-06 mem: 47% pow: 589.532 W 0: INFO 26-04-30 04:21:41.657506 - 12:46:22 - step: 47300 acc: 0 loss: 1.6823 grad: 1.48e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5776 data: 0.1458 lr: 4.02e-06 mem: 47% pow: 637.381 W 0: INFO 26-04-30 04:21:58.641438 - 12:46:39 - step: 47310 acc: 0 loss: 1.6751 grad: 1.46e-01 flops: 3.33e+14 wps: 3.86e+04 iter: 0.6368 data: 0.089 lr: 4.00e-06 mem: 54% pow: 638.809 W 0: INFO 26-04-30 04:22:12.372957 - 12:46:53 - step: 47320 acc: 0 loss: 1.5436 grad: 1.47e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6094 data: 0.0847 lr: 3.99e-06 mem: 47% pow: 648.945 W 0: INFO 26-04-30 04:22:26.044578 - 12:47:06 - step: 47330 acc: 0 loss: 1.5916 grad: 1.50e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6326 data: 0.0769 lr: 3.97e-06 mem: 47% pow: 650.741 W 0: INFO 26-04-30 04:22:39.618152 - 12:47:20 - step: 47340 acc: 0 loss: 1.5508 grad: 1.45e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6136 data: 0.089 lr: 3.96e-06 mem: 47% pow: 649.113 W 0: INFO 26-04-30 04:22:53.321286 - 12:47:34 - step: 47350 acc: 0 loss: 1.3353 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6008 data: 0.0829 lr: 3.94e-06 mem: 47% pow: 668.042 W 0: INFO 26-04-30 04:23:06.960567 - 12:47:47 - step: 47360 acc: 0 loss: 1.5363 grad: 1.42e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5944 data: 0.0879 lr: 3.93e-06 mem: 47% pow: 661.281 W 0: INFO 26-04-30 04:23:20.513200 - 12:48:01 - step: 47370 acc: 0 loss: 1.3097 grad: 1.42e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6049 data: 0.0897 lr: 3.91e-06 mem: 47% pow: 652.399 W 0: INFO 26-04-30 04:23:34.720209 - 12:48:15 - step: 47380 acc: 0 loss: 1.7458 grad: 1.48e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5884 data: 0.0913 lr: 3.90e-06 mem: 47% pow: 665.773 W 0: INFO 26-04-30 04:23:48.221351 - 12:48:29 - step: 47390 acc: 0 loss: 1.6968 grad: 1.43e-01 flops: 4.18e+14 wps: 4.86e+04 iter: 0.6032 data: 0.0838 lr: 3.89e-06 mem: 47% pow: 665.773 W 0: INFO 26-04-30 04:24:01.783623 - 12:48:42 - step: 47400 acc: 0 loss: 1.3057 grad: 1.44e-01 flops: 4.17e+14 wps: 4.83e+04 iter: 0.5971 data: 0.0907 lr: 3.87e-06 mem: 47% pow: 657.956 W 0: INFO 26-04-30 04:24:18.815437 - 12:48:59 - step: 47410 acc: 0 loss: 1.7632 grad: 1.57e-01 flops: 3.32e+14 wps: 3.85e+04 iter: 0.5781 data: 0.1151 lr: 3.86e-06 mem: 54% pow: 660.524 W 0: INFO 26-04-30 04:24:32.574290 - 12:49:13 - step: 47420 acc: 0 loss: 1.4665 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6131 data: 0.0854 lr: 3.84e-06 mem: 47% pow: 650.312 W 0: INFO 26-04-30 04:24:46.464854 - 12:49:27 - step: 47430 acc: 0 loss: 1.5152 grad: 1.46e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5768 data: 0.1315 lr: 3.83e-06 mem: 47% pow: 650.63 W 0: INFO 26-04-30 04:25:00.195047 - 12:49:40 - step: 47440 acc: 0 loss: 1.7083 grad: 1.46e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6063 data: 0.0948 lr: 3.81e-06 mem: 47% pow: 646.591 W 0: INFO 26-04-30 04:25:14.128677 - 12:49:54 - step: 47450 acc: 0 loss: 1.7311 grad: 1.46e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5976 data: 0.0842 lr: 3.80e-06 mem: 47% pow: 680.186 W 0: INFO 26-04-30 04:25:27.998655 - 12:50:08 - step: 47460 acc: 0 loss: 1.5637 grad: 1.48e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6204 data: 0.0857 lr: 3.78e-06 mem: 47% pow: 650.022 W 0: INFO 26-04-30 04:25:41.567380 - 12:50:22 - step: 47470 acc: 0 loss: 1.3777 grad: 1.46e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5936 data: 0.0925 lr: 3.77e-06 mem: 47% pow: 660.487 W 0: INFO 26-04-30 04:25:55.355050 - 12:50:36 - step: 47480 acc: 0 loss: 1.6501 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5848 data: 0.093 lr: 3.75e-06 mem: 47% pow: 660.75 W 0: INFO 26-04-30 04:26:09.190964 - 12:50:49 - step: 47490 acc: 0 loss: 1.7381 grad: 1.43e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5782 data: 0.0905 lr: 3.74e-06 mem: 47% pow: 669.619 W 0: INFO 26-04-30 04:26:22.852644 - 12:51:03 - step: 47500 acc: 0 loss: 1.6038 grad: 1.50e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5906 data: 0.0918 lr: 3.72e-06 mem: 47% pow: 678.88 W 0: INFO 26-04-30 04:26:39.449751 - 12:51:20 - step: 47510 acc: 0 loss: 1.3759 grad: 1.45e-01 flops: 3.40e+14 wps: 3.95e+04 iter: 0.6033 data: 0.093 lr: 3.71e-06 mem: 54% pow: 648.152 W 0: INFO 26-04-30 04:26:52.974473 - 12:51:33 - step: 47520 acc: 0 loss: 1.4932 grad: 1.49e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5965 data: 0.0819 lr: 3.69e-06 mem: 47% pow: 660.835 W 0: INFO 26-04-30 04:27:06.440176 - 12:51:47 - step: 47530 acc: 0 loss: 1.4291 grad: 1.44e-01 flops: 4.19e+14 wps: 4.87e+04 iter: 0.6007 data: 0.0883 lr: 3.68e-06 mem: 47% pow: 658.69 W 0: INFO 26-04-30 04:27:20.028494 - 12:52:00 - step: 47540 acc: 0 loss: 1.6242 grad: 1.47e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6556 data: 0.0901 lr: 3.66e-06 mem: 47% pow: 618.626 W 0: INFO 26-04-30 04:27:33.590816 - 12:52:14 - step: 47550 acc: 0 loss: 1.8034 grad: 1.44e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5877 data: 0.0902 lr: 3.65e-06 mem: 47% pow: 661.869 W 0: INFO 26-04-30 04:27:47.357797 - 12:52:28 - step: 47560 acc: 0 loss: 1.4546 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5933 data: 0.0876 lr: 3.63e-06 mem: 47% pow: 660.092 W 0: INFO 26-04-30 04:28:01.018920 - 12:52:41 - step: 47570 acc: 0 loss: 1.6334 grad: 1.46e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6304 data: 0.0879 lr: 3.62e-06 mem: 47% pow: 637.137 W 0: INFO 26-04-30 04:28:14.581511 - 12:52:55 - step: 47580 acc: 0 loss: 1.5492 grad: 1.45e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5999 data: 0.0892 lr: 3.60e-06 mem: 47% pow: 652.668 W 0: INFO 26-04-30 04:28:28.305355 - 12:53:09 - step: 47590 acc: 0 loss: 1.5604 grad: 1.43e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5948 data: 0.0949 lr: 3.59e-06 mem: 47% pow: 674.263 W 0: INFO 26-04-30 04:28:42.098882 - 12:53:22 - step: 47600 acc: 0 loss: 1.1505 grad: 1.51e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.589 data: 0.0967 lr: 3.57e-06 mem: 47% pow: 664.174 W 0: INFO 26-04-30 04:28:58.754295 - 12:53:39 - step: 47610 acc: 0 loss: 1.4264 grad: 1.49e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.6035 data: 0.091 lr: 3.56e-06 mem: 54% pow: 650.049 W 0: INFO 26-04-30 04:29:12.692808 - 12:53:53 - step: 47620 acc: 0 loss: 1.7661 grad: 1.51e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6181 data: 0.0815 lr: 3.54e-06 mem: 47% pow: 648.502 W 0: INFO 26-04-30 04:29:26.391461 - 12:54:07 - step: 47630 acc: 0 loss: 1.7015 grad: 1.49e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6728 data: 0.0862 lr: 3.53e-06 mem: 47% pow: 615.344 W 0: INFO 26-04-30 04:29:40.124237 - 12:54:20 - step: 47640 acc: 0 loss: 1.4395 grad: 1.49e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5969 data: 0.0918 lr: 3.51e-06 mem: 47% pow: 666.183 W 0: INFO 26-04-30 04:29:54.410313 - 12:54:35 - step: 47650 acc: 0 loss: 1.356 grad: 1.49e-01 flops: 3.95e+14 wps: 4.59e+04 iter: 0.7487 data: 0.0856 lr: 3.50e-06 mem: 47% pow: 573.641 W 0: INFO 26-04-30 04:30:08.171931 - 12:54:48 - step: 47660 acc: 0 loss: 1.6097 grad: 1.50e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5894 data: 0.0827 lr: 3.48e-06 mem: 47% pow: 673.747 W 0: INFO 26-04-30 04:30:21.837833 - 12:55:02 - step: 47670 acc: 0 loss: 1.4839 grad: 1.46e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5984 data: 0.0849 lr: 3.47e-06 mem: 47% pow: 663.58 W 0: INFO 26-04-30 04:30:35.584718 - 12:55:16 - step: 47680 acc: 0 loss: 1.7516 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6105 data: 0.0847 lr: 3.45e-06 mem: 47% pow: 654.587 W 0: INFO 26-04-30 04:30:49.515568 - 12:55:30 - step: 47690 acc: 0 loss: 1.6705 grad: 1.45e-01 flops: 4.05e+14 wps: 4.71e+04 iter: 0.5965 data: 0.0853 lr: 3.44e-06 mem: 47% pow: 657.709 W 0: INFO 26-04-30 04:31:03.337171 - 12:55:44 - step: 47700 acc: 0 loss: 1.6099 grad: 1.47e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6578 data: 0.0724 lr: 3.42e-06 mem: 47% pow: 638.66 W 0: INFO 26-04-30 04:31:20.122018 - 12:56:00 - step: 47710 acc: 0 loss: 1.9112 grad: 1.44e-01 flops: 3.36e+14 wps: 3.91e+04 iter: 0.7745 data: 0.0911 lr: 3.41e-06 mem: 54% pow: 562.627 W 0: INFO 26-04-30 04:31:33.842012 - 12:56:14 - step: 47720 acc: 0 loss: 1.2469 grad: 1.47e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.7077 data: 0.0728 lr: 3.39e-06 mem: 47% pow: 597.829 W 0: INFO 26-04-30 04:31:48.227418 - 12:56:29 - step: 47730 acc: 0 loss: 1.3013 grad: 1.47e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.5785 data: 0.0886 lr: 3.38e-06 mem: 47% pow: 670.027 W 0: INFO 26-04-30 04:32:01.959084 - 12:56:42 - step: 47740 acc: 0 loss: 1.598 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5827 data: 0.0848 lr: 3.36e-06 mem: 47% pow: 680.169 W 0: INFO 26-04-30 04:32:15.494807 - 12:56:56 - step: 47750 acc: 0 loss: 1.3287 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5836 data: 0.0927 lr: 3.35e-06 mem: 47% pow: 667.489 W 0: INFO 26-04-30 04:32:29.332324 - 12:57:10 - step: 47760 acc: 0 loss: 1.5224 grad: 1.44e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.61 data: 0.0881 lr: 3.33e-06 mem: 47% pow: 651.357 W 0: INFO 26-04-30 04:32:43.297913 - 12:57:24 - step: 47770 acc: 0 loss: 1.7942 grad: 1.50e-01 flops: 4.05e+14 wps: 4.69e+04 iter: 0.6165 data: 0.079 lr: 3.32e-06 mem: 47% pow: 645.985 W 0: INFO 26-04-30 04:32:58.247188 - 12:57:39 - step: 47780 acc: 0 loss: 1.5961 grad: 1.47e-01 flops: 3.78e+14 wps: 4.38e+04 iter: 1.4357 data: 0.0949 lr: 3.30e-06 mem: 47% pow: 466.858 W 0: INFO 26-04-30 04:33:11.853728 - 12:57:52 - step: 47790 acc: 0 loss: 1.4289 grad: 1.51e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6009 data: 0.0938 lr: 3.29e-06 mem: 47% pow: 649.202 W 0: INFO 26-04-30 04:33:25.691512 - 12:58:06 - step: 47800 acc: 0 loss: 1.8064 grad: 1.50e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5815 data: 0.0963 lr: 3.28e-06 mem: 47% pow: 658.707 W 0: INFO 26-04-30 04:33:42.345392 - 12:58:23 - step: 47810 acc: 0 loss: 1.4879 grad: 1.46e-01 flops: 3.39e+14 wps: 3.94e+04 iter: 0.5887 data: 0.0888 lr: 3.26e-06 mem: 54% pow: 663.721 W 0: INFO 26-04-30 04:33:56.044470 - 12:58:36 - step: 47820 acc: 0 loss: 1.34 grad: 1.49e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5977 data: 0.0911 lr: 3.25e-06 mem: 47% pow: 661.684 W 0: INFO 26-04-30 04:34:09.746724 - 12:58:50 - step: 47830 acc: 0 loss: 1.5184 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5831 data: 0.0891 lr: 3.23e-06 mem: 47% pow: 672.456 W 0: INFO 26-04-30 04:34:23.689726 - 12:59:04 - step: 47840 acc: 0 loss: 1.4409 grad: 1.47e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6283 data: 0.077 lr: 3.22e-06 mem: 47% pow: 651.646 W 0: INFO 26-04-30 04:34:38.087775 - 12:59:18 - step: 47850 acc: 0 loss: 1.4695 grad: 1.47e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6062 data: 0.0857 lr: 3.20e-06 mem: 47% pow: 647.69 W 0: INFO 26-04-30 04:34:51.917913 - 12:59:32 - step: 47860 acc: 0 loss: 1.6112 grad: 1.49e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.7506 data: 0.0836 lr: 3.19e-06 mem: 47% pow: 578.681 W 0: INFO 26-04-30 04:35:05.758123 - 12:59:46 - step: 47870 acc: 0 loss: 1.6292 grad: 1.45e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5827 data: 0.0976 lr: 3.17e-06 mem: 47% pow: 665.182 W 0: INFO 26-04-30 04:35:19.393888 - 13:00:00 - step: 47880 acc: 0 loss: 1.8282 grad: 1.44e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.585 data: 0.0922 lr: 3.16e-06 mem: 47% pow: 677.919 W 0: INFO 26-04-30 04:35:33.143505 - 13:00:13 - step: 47890 acc: 0 loss: 1.7294 grad: 1.47e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5815 data: 0.0928 lr: 3.14e-06 mem: 47% pow: 684.878 W 0: INFO 26-04-30 04:35:46.647214 - 13:00:27 - step: 47900 acc: 0 loss: 1.8147 grad: 1.47e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5931 data: 0.0886 lr: 3.13e-06 mem: 47% pow: 660.645 W 0: INFO 26-04-30 04:36:03.433160 - 13:00:44 - step: 47910 acc: 0 loss: 1.4994 grad: 1.47e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6152 data: 0.0824 lr: 3.11e-06 mem: 54% pow: 646.946 W 0: INFO 26-04-30 04:36:17.340057 - 13:00:58 - step: 47920 acc: 0 loss: 1.4728 grad: 1.77e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5813 data: 0.1026 lr: 3.10e-06 mem: 47% pow: 663.388 W 0: INFO 26-04-30 04:36:30.860055 - 13:01:11 - step: 47930 acc: 0 loss: 1.759 grad: 1.48e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6144 data: 0.0806 lr: 3.08e-06 mem: 47% pow: 651.247 W 0: INFO 26-04-30 04:36:44.430412 - 13:01:25 - step: 47940 acc: 0 loss: 1.3072 grad: 1.46e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6066 data: 0.0872 lr: 3.07e-06 mem: 47% pow: 655.266 W 0: INFO 26-04-30 04:36:58.236041 - 13:01:39 - step: 47950 acc: 0 loss: 1.5645 grad: 1.53e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.5954 data: 0.0726 lr: 3.05e-06 mem: 47% pow: 673.231 W 0: INFO 26-04-30 04:37:12.080141 - 13:01:52 - step: 47960 acc: 0 loss: 1.5842 grad: 1.43e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.639 data: 0.0857 lr: 3.04e-06 mem: 47% pow: 639.221 W 0: INFO 26-04-30 04:37:25.749440 - 13:02:06 - step: 47970 acc: 0 loss: 1.4676 grad: 1.46e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.602 data: 0.0832 lr: 3.02e-06 mem: 47% pow: 670.605 W 0: INFO 26-04-30 04:37:39.515823 - 13:02:20 - step: 47980 acc: 0 loss: 1.3832 grad: 1.48e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6459 data: 0.0892 lr: 3.01e-06 mem: 47% pow: 634.175 W 0: INFO 26-04-30 04:37:53.064303 - 13:02:33 - step: 47990 acc: 0 loss: 1.7003 grad: 1.46e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6067 data: 0.0733 lr: 2.99e-06 mem: 47% pow: 661.475 W 0: INFO 26-04-30 04:38:06.855757 - 13:02:47 - step: 48000 acc: 0 loss: 1.9084 grad: 1.51e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6227 data: 0.0873 lr: 2.98e-06 mem: 47% pow: 663.166 W 0: INFO 26-04-30 04:38:10.537619 - 13:02:51 - garbage collection 0: INFO 26-04-30 04:38:25.135523 - 13:03:05 - step: 48010 acc: 0 loss: 1.8945 grad: 1.45e-01 flops: 3.09e+14 wps: 3.59e+04 iter: 0.5798 data: 0.1179 lr: 2.96e-06 mem: 54% pow: 658.727 W 0: INFO 26-04-30 04:38:38.971879 - 13:03:19 - step: 48020 acc: 0 loss: 1.5372 grad: 1.47e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.5891 data: 0.0911 lr: 2.95e-06 mem: 47% pow: 658.366 W 0: INFO 26-04-30 04:38:52.543188 - 13:03:33 - step: 48030 acc: 0 loss: 1.5615 grad: 1.48e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.5957 data: 0.0871 lr: 2.93e-06 mem: 47% pow: 658.054 W 0: INFO 26-04-30 04:39:06.073182 - 13:03:46 - step: 48040 acc: 0 loss: 1.2981 grad: 1.46e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6213 data: 0.0832 lr: 2.92e-06 mem: 47% pow: 654.384 W 0: INFO 26-04-30 04:39:19.995081 - 13:04:00 - step: 48050 acc: 0 loss: 1.7933 grad: 1.45e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6221 data: 0.0756 lr: 2.90e-06 mem: 47% pow: 643.116 W 0: INFO 26-04-30 04:39:33.705740 - 13:04:14 - step: 48060 acc: 0 loss: 1.5295 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6205 data: 0.0637 lr: 2.89e-06 mem: 47% pow: 659.81 W 0: INFO 26-04-30 04:39:47.406789 - 13:04:28 - step: 48070 acc: 0 loss: 1.8974 grad: 1.46e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5804 data: 0.1502 lr: 2.87e-06 mem: 47% pow: 630.782 W 0: INFO 26-04-30 04:40:01.326152 - 13:04:42 - step: 48080 acc: 0 loss: 1.4095 grad: 1.45e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6247 data: 0.082 lr: 2.86e-06 mem: 47% pow: 652.902 W 0: INFO 26-04-30 04:40:15.057780 - 13:04:55 - step: 48090 acc: 0 loss: 1.2612 grad: 1.46e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6042 data: 0.0864 lr: 2.84e-06 mem: 47% pow: 670.812 W 0: INFO 26-04-30 04:40:28.969089 - 13:05:09 - step: 48100 acc: 0 loss: 1.7842 grad: 1.48e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6314 data: 0.0815 lr: 2.83e-06 mem: 47% pow: 648.755 W 0: INFO 26-04-30 04:40:46.044798 - 13:05:26 - step: 48110 acc: 0 loss: 1.7071 grad: 1.43e-01 flops: 3.31e+14 wps: 3.84e+04 iter: 0.589 data: 0.0912 lr: 2.81e-06 mem: 54% pow: 658.687 W 0: INFO 26-04-30 04:41:00.222884 - 13:05:41 - step: 48120 acc: 0 loss: 1.5926 grad: 1.46e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.7476 data: 0.0771 lr: 2.80e-06 mem: 47% pow: 591.61 W 0: INFO 26-04-30 04:41:14.201847 - 13:05:54 - step: 48130 acc: 0 loss: 1.6496 grad: 1.62e-01 flops: 4.04e+14 wps: 4.69e+04 iter: 0.6022 data: 0.0758 lr: 2.78e-06 mem: 47% pow: 662.351 W 0: INFO 26-04-30 04:41:29.220969 - 13:06:10 - step: 48140 acc: 0 loss: 1.8334 grad: 1.51e-01 flops: 3.76e+14 wps: 4.36e+04 iter: 0.6177 data: 0.0854 lr: 2.77e-06 mem: 47% pow: 655.076 W 0: INFO 26-04-30 04:41:42.941689 - 13:06:23 - step: 48150 acc: 0 loss: 1.5472 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6196 data: 0.0813 lr: 2.75e-06 mem: 47% pow: 648.538 W 0: INFO 26-04-30 04:41:56.777742 - 13:06:37 - step: 48160 acc: 0 loss: 1.5474 grad: 1.44e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6153 data: 0.085 lr: 2.74e-06 mem: 47% pow: 651.134 W 0: INFO 26-04-30 04:42:10.497405 - 13:06:51 - step: 48170 acc: 0 loss: 1.8887 grad: 1.45e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5893 data: 0.088 lr: 2.72e-06 mem: 47% pow: 665.57 W 0: INFO 26-04-30 04:42:24.272469 - 13:07:05 - step: 48180 acc: 0 loss: 1.6733 grad: 1.49e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6008 data: 0.0843 lr: 2.71e-06 mem: 47% pow: 667.365 W 0: INFO 26-04-30 04:42:37.779824 - 13:07:18 - step: 48190 acc: 0 loss: 1.7189 grad: 1.47e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6297 data: 0.0897 lr: 2.69e-06 mem: 47% pow: 633.831 W 0: INFO 26-04-30 04:42:51.953918 - 13:07:32 - step: 48200 acc: 0 loss: 1.5994 grad: 1.47e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6228 data: 0.0871 lr: 2.68e-06 mem: 47% pow: 638.657 W 0: INFO 26-04-30 04:43:08.587105 - 13:07:49 - step: 48210 acc: 0 loss: 1.629 grad: 1.52e-01 flops: 3.40e+14 wps: 3.94e+04 iter: 0.6333 data: 0.0896 lr: 2.67e-06 mem: 54% pow: 641.079 W 0: INFO 26-04-30 04:43:22.410565 - 13:08:03 - step: 48220 acc: 0 loss: 2.2185 grad: 1.50e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6461 data: 0.0925 lr: 2.65e-06 mem: 47% pow: 620.628 W 0: INFO 26-04-30 04:43:36.287217 - 13:08:17 - step: 48230 acc: 0 loss: 1.6433 grad: 1.50e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6122 data: 0.0911 lr: 2.64e-06 mem: 47% pow: 652.243 W 0: INFO 26-04-30 04:43:50.482020 - 13:08:31 - step: 48240 acc: 0 loss: 1.828 grad: 1.49e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5967 data: 0.097 lr: 2.62e-06 mem: 47% pow: 647.915 W 0: INFO 26-04-30 04:44:04.536872 - 13:08:45 - step: 48250 acc: 0 loss: 1.3883 grad: 1.49e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6083 data: 0.0862 lr: 2.61e-06 mem: 47% pow: 657.751 W 0: INFO 26-04-30 04:44:18.059444 - 13:08:58 - step: 48260 acc: 0 loss: 1.3563 grad: 1.46e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.6262 data: 0.0606 lr: 2.59e-06 mem: 47% pow: 659.99 W 0: INFO 26-04-30 04:44:32.018016 - 13:09:12 - step: 48270 acc: 0 loss: 1.4298 grad: 1.48e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6544 data: 0.0852 lr: 2.58e-06 mem: 47% pow: 619.775 W 0: INFO 26-04-30 04:44:45.664993 - 13:09:26 - step: 48280 acc: 0 loss: 1.5382 grad: 1.47e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5901 data: 0.0945 lr: 2.56e-06 mem: 47% pow: 667.988 W 0: INFO 26-04-30 04:44:59.504009 - 13:09:40 - step: 48290 acc: 0 loss: 1.6415 grad: 1.45e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6162 data: 0.0876 lr: 2.55e-06 mem: 47% pow: 653.556 W 0: INFO 26-04-30 04:45:13.631315 - 13:09:54 - step: 48300 acc: 0 loss: 1.5387 grad: 1.48e-01 flops: 4.00e+14 wps: 4.64e+04 iter: 0.6594 data: 0.0692 lr: 2.53e-06 mem: 47% pow: 636.09 W 0: INFO 26-04-30 04:45:30.089035 - 13:10:10 - step: 48310 acc: 0 loss: 1.7106 grad: 1.51e-01 flops: 3.43e+14 wps: 3.98e+04 iter: 0.5877 data: 0.0941 lr: 2.52e-06 mem: 54% pow: 656.922 W 0: INFO 26-04-30 04:45:43.930129 - 13:10:24 - step: 48320 acc: 0 loss: 1.9386 grad: 1.56e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6017 data: 0.0904 lr: 2.50e-06 mem: 47% pow: 656.779 W 0: INFO 26-04-30 04:45:58.097878 - 13:10:38 - step: 48330 acc: 0 loss: 1.7008 grad: 1.46e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6345 data: 0.0815 lr: 2.49e-06 mem: 47% pow: 640.778 W 0: INFO 26-04-30 04:46:11.979264 - 13:10:52 - step: 48340 acc: 0 loss: 1.4381 grad: 1.51e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5995 data: 0.0909 lr: 2.47e-06 mem: 47% pow: 658.986 W 0: INFO 26-04-30 04:46:25.605967 - 13:11:06 - step: 48350 acc: 0 loss: 1.8718 grad: 1.48e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6159 data: 0.0809 lr: 2.46e-06 mem: 47% pow: 654.294 W 0: INFO 26-04-30 04:46:39.481472 - 13:11:20 - step: 48360 acc: 0 loss: 1.3887 grad: 1.48e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.6172 data: 0.1155 lr: 2.44e-06 mem: 47% pow: 636.247 W 0: INFO 26-04-30 04:46:53.346963 - 13:11:34 - step: 48370 acc: 0 loss: 1.4934 grad: 1.49e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.591 data: 0.094 lr: 2.43e-06 mem: 47% pow: 668.478 W 0: INFO 26-04-30 04:47:07.789541 - 13:11:48 - step: 48380 acc: 0 loss: 1.8768 grad: 1.45e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6068 data: 0.0972 lr: 2.41e-06 mem: 47% pow: 648.553 W 0: INFO 26-04-30 04:47:21.788852 - 13:12:02 - step: 48390 acc: 0 loss: 1.5734 grad: 1.47e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.6079 data: 0.0825 lr: 2.40e-06 mem: 47% pow: 664.111 W 0: INFO 26-04-30 04:47:36.137102 - 13:12:16 - step: 48400 acc: 0 loss: 1.5655 grad: 1.48e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.6347 data: 0.078 lr: 2.38e-06 mem: 47% pow: 642.731 W 0: INFO 26-04-30 04:47:52.659270 - 13:12:33 - step: 48410 acc: 0 loss: 1.385 grad: 1.48e-01 flops: 3.42e+14 wps: 3.97e+04 iter: 0.5879 data: 0.0911 lr: 2.37e-06 mem: 54% pow: 656.962 W 0: INFO 26-04-30 04:48:06.283966 - 13:12:47 - step: 48420 acc: 0 loss: 1.5872 grad: 1.49e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.5921 data: 0.0886 lr: 2.35e-06 mem: 47% pow: 658.875 W 0: INFO 26-04-30 04:48:20.147953 - 13:13:00 - step: 48430 acc: 0 loss: 1.4756 grad: 1.49e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5801 data: 0.1039 lr: 2.34e-06 mem: 47% pow: 666.488 W 0: INFO 26-04-30 04:48:33.822962 - 13:13:14 - step: 48440 acc: 0 loss: 1.4903 grad: 1.45e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.5983 data: 0.0961 lr: 2.32e-06 mem: 47% pow: 662.906 W 0: INFO 26-04-30 04:48:47.674285 - 13:13:28 - step: 48450 acc: 0 loss: 1.7558 grad: 1.47e-01 flops: 4.08e+14 wps: 4.73e+04 iter: 0.6171 data: 0.0895 lr: 2.31e-06 mem: 47% pow: 647.758 W 0: INFO 26-04-30 04:49:01.533768 - 13:13:42 - step: 48460 acc: 0 loss: 1.6642 grad: 1.48e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5949 data: 0.0785 lr: 2.29e-06 mem: 47% pow: 665.095 W 0: INFO 26-04-30 04:49:15.905016 - 13:13:56 - step: 48470 acc: 0 loss: 1.8896 grad: 1.47e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.5868 data: 0.097 lr: 2.28e-06 mem: 47% pow: 661.545 W 0: INFO 26-04-30 04:49:29.947468 - 13:14:10 - step: 48480 acc: 0 loss: 1.6757 grad: 1.46e-01 flops: 4.02e+14 wps: 4.67e+04 iter: 0.6901 data: 0.0858 lr: 2.26e-06 mem: 47% pow: 624.223 W 0: INFO 26-04-30 04:49:43.718034 - 13:14:24 - step: 48490 acc: 0 loss: 2.0006 grad: 1.49e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5997 data: 0.0864 lr: 2.25e-06 mem: 47% pow: 663.083 W 0: INFO 26-04-30 04:49:58.099990 - 13:14:38 - step: 48500 acc: 0 loss: 1.2602 grad: 1.49e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 0.6407 data: 0.0773 lr: 2.23e-06 mem: 47% pow: 636.159 W 0: INFO 26-04-30 04:50:14.678627 - 13:14:55 - step: 48510 acc: 0 loss: 1.5246 grad: 1.46e-01 flops: 3.41e+14 wps: 3.95e+04 iter: 0.6159 data: 0.0791 lr: 2.22e-06 mem: 54% pow: 663.013 W 0: INFO 26-04-30 04:50:28.402303 - 13:15:09 - step: 48520 acc: 0 loss: 1.5802 grad: 1.50e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6209 data: 0.0783 lr: 2.20e-06 mem: 47% pow: 643.178 W 0: INFO 26-04-30 04:50:42.757260 - 13:15:23 - step: 48530 acc: 0 loss: 1.9144 grad: 1.44e-01 flops: 3.94e+14 wps: 4.57e+04 iter: 0.5958 data: 0.0895 lr: 2.19e-06 mem: 47% pow: 664.649 W 0: INFO 26-04-30 04:50:57.240671 - 13:15:38 - step: 48540 acc: 0 loss: 1.2729 grad: 1.45e-01 flops: 3.90e+14 wps: 4.53e+04 iter: 0.6338 data: 0.0873 lr: 2.17e-06 mem: 47% pow: 633.705 W 0: INFO 26-04-30 04:51:11.662626 - 13:15:52 - step: 48550 acc: 0 loss: 1.6803 grad: 1.45e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.5846 data: 0.0869 lr: 2.16e-06 mem: 47% pow: 689.335 W 0: INFO 26-04-30 04:51:25.445151 - 13:16:06 - step: 48560 acc: 0 loss: 1.4755 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5892 data: 0.0889 lr: 2.14e-06 mem: 47% pow: 663.975 W 0: INFO 26-04-30 04:51:39.287334 - 13:16:20 - step: 48570 acc: 0 loss: 2.0627 grad: 1.46e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5973 data: 0.0852 lr: 2.13e-06 mem: 47% pow: 664.009 W 0: INFO 26-04-30 04:51:53.113713 - 13:16:33 - step: 48580 acc: 0 loss: 1.5063 grad: 1.50e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6531 data: 0.0545 lr: 2.11e-06 mem: 47% pow: 643.557 W 0: INFO 26-04-30 04:52:06.946228 - 13:16:47 - step: 48590 acc: 0 loss: 1.5794 grad: 1.45e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.62 data: 0.0825 lr: 2.10e-06 mem: 47% pow: 652.936 W 0: INFO 26-04-30 04:52:20.689846 - 13:17:01 - step: 48600 acc: 0 loss: 1.7064 grad: 1.52e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6034 data: 0.0816 lr: 2.08e-06 mem: 47% pow: 662.443 W 0: INFO 26-04-30 04:52:37.499755 - 13:17:18 - step: 48610 acc: 0 loss: 1.4599 grad: 1.46e-01 flops: 3.36e+14 wps: 3.90e+04 iter: 0.6148 data: 0.0812 lr: 2.07e-06 mem: 54% pow: 663.079 W 0: INFO 26-04-30 04:52:51.151052 - 13:17:31 - step: 48620 acc: 0 loss: 1.7546 grad: 1.48e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.6268 data: 0.0629 lr: 2.05e-06 mem: 47% pow: 675.545 W 0: INFO 26-04-30 04:53:05.149165 - 13:17:45 - step: 48630 acc: 0 loss: 1.715 grad: 1.45e-01 flops: 4.03e+14 wps: 4.68e+04 iter: 0.5824 data: 0.0875 lr: 2.04e-06 mem: 47% pow: 672.309 W 0: INFO 26-04-30 04:53:18.865119 - 13:17:59 - step: 48640 acc: 0 loss: 1.6353 grad: 1.46e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5915 data: 0.0885 lr: 2.03e-06 mem: 47% pow: 657.604 W 0: INFO 26-04-30 04:53:32.940235 - 13:18:13 - step: 48650 acc: 0 loss: 1.6304 grad: 1.49e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.6129 data: 0.0816 lr: 2.01e-06 mem: 47% pow: 659.209 W 0: INFO 26-04-30 04:53:46.725506 - 13:18:27 - step: 48660 acc: 0 loss: 1.5231 grad: 1.48e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6211 data: 0.081 lr: 2.00e-06 mem: 47% pow: 640.825 W 0: INFO 26-04-30 04:54:00.304296 - 13:18:41 - step: 48670 acc: 0 loss: 1.6986 grad: 1.47e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6108 data: 0.0833 lr: 1.98e-06 mem: 47% pow: 660.176 W 0: INFO 26-04-30 04:54:14.558110 - 13:18:55 - step: 48680 acc: 0 loss: 1.5902 grad: 1.48e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.6336 data: 0.0825 lr: 1.97e-06 mem: 47% pow: 636.129 W 0: INFO 26-04-30 04:54:29.363300 - 13:19:10 - step: 48690 acc: 0 loss: 1.5227 grad: 1.64e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.5975 data: 0.0796 lr: 1.95e-06 mem: 47% pow: 667.303 W 0: INFO 26-04-30 04:54:43.227582 - 13:19:24 - step: 48700 acc: 0 loss: 1.724 grad: 1.53e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5937 data: 0.0932 lr: 1.94e-06 mem: 47% pow: 666.281 W 0: INFO 26-04-30 04:55:00.520646 - 13:19:41 - step: 48710 acc: 0 loss: 1.7504 grad: 1.47e-01 flops: 3.27e+14 wps: 3.79e+04 iter: 0.66 data: 0.0913 lr: 1.92e-06 mem: 54% pow: 625.299 W 0: INFO 26-04-30 04:55:14.338905 - 13:19:55 - step: 48720 acc: 0 loss: 1.579 grad: 1.48e-01 flops: 4.09e+14 wps: 4.74e+04 iter: 0.6121 data: 0.0841 lr: 1.91e-06 mem: 47% pow: 661.028 W 0: INFO 26-04-30 04:55:31.011269 - 13:20:11 - step: 48730 acc: 0 loss: 1.4766 grad: 1.47e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5801 data: 0.0889 lr: 1.89e-06 mem: 47% pow: 682.755 W 0: INFO 26-04-30 04:55:45.569999 - 13:20:26 - step: 48740 acc: 0 loss: 1.4007 grad: 1.56e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.6248 data: 0.06 lr: 1.88e-06 mem: 47% pow: 675.077 W 0: INFO 26-04-30 04:55:59.647355 - 13:20:40 - step: 48750 acc: 0 loss: 1.5731 grad: 1.47e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.7503 data: 0.09 lr: 1.86e-06 mem: 47% pow: 568.913 W 0: INFO 26-04-30 04:56:13.410992 - 13:20:54 - step: 48760 acc: 0 loss: 1.9361 grad: 1.44e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5965 data: 0.0904 lr: 1.85e-06 mem: 47% pow: 671.682 W 0: INFO 26-04-30 04:56:27.144431 - 13:21:07 - step: 48770 acc: 0 loss: 1.1795 grad: 1.45e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5807 data: 0.112 lr: 1.83e-06 mem: 47% pow: 659.285 W 0: INFO 26-04-30 04:56:41.059669 - 13:21:21 - step: 48780 acc: 0 loss: 1.3337 grad: 1.44e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6061 data: 0.0678 lr: 1.82e-06 mem: 47% pow: 670.609 W 0: INFO 26-04-30 04:56:55.166349 - 13:21:35 - step: 48790 acc: 0 loss: 1.0585 grad: 1.51e-01 flops: 4.00e+14 wps: 4.65e+04 iter: 0.7928 data: 0.0887 lr: 1.80e-06 mem: 47% pow: 546.104 W 0: INFO 26-04-30 04:57:09.043213 - 13:21:49 - step: 48800 acc: 0 loss: 1.6881 grad: 1.45e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5981 data: 0.0909 lr: 1.79e-06 mem: 47% pow: 658.665 W 0: INFO 26-04-30 04:57:25.787660 - 13:22:06 - step: 48810 acc: 0 loss: 1.5257 grad: 1.49e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.603 data: 0.0812 lr: 1.77e-06 mem: 54% pow: 660.877 W 0: INFO 26-04-30 04:57:39.735636 - 13:22:20 - step: 48820 acc: 0 loss: 1.5317 grad: 1.46e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.595 data: 0.1327 lr: 1.76e-06 mem: 47% pow: 634.137 W 0: INFO 26-04-30 04:57:53.881493 - 13:22:34 - step: 48830 acc: 0 loss: 1.5197 grad: 1.51e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.6316 data: 0.0863 lr: 1.74e-06 mem: 47% pow: 634.496 W 0: INFO 26-04-30 04:58:09.263474 - 13:22:50 - step: 48840 acc: 0 loss: 1.4803 grad: 1.50e-01 flops: 3.67e+14 wps: 4.26e+04 iter: 1.7341 data: 0.0912 lr: 1.73e-06 mem: 47% pow: 457.518 W 0: INFO 26-04-30 04:58:22.981817 - 13:23:03 - step: 48850 acc: 0 loss: 1.7397 grad: 1.53e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6726 data: 0.0772 lr: 1.71e-06 mem: 47% pow: 637.763 W 0: INFO 26-04-30 04:58:38.356335 - 13:23:19 - step: 48860 acc: 0 loss: 1.8021 grad: 1.46e-01 flops: 3.70e+14 wps: 4.30e+04 iter: 0.6725 data: 0.0036 lr: 1.70e-06 mem: 47% pow: 661.001 W 0: INFO 26-04-30 04:58:52.311223 - 13:23:33 - step: 48870 acc: 0 loss: 1.6212 grad: 1.48e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.7015 data: 0.085 lr: 1.68e-06 mem: 47% pow: 605.151 W 0: INFO 26-04-30 04:59:06.201086 - 13:23:46 - step: 48880 acc: 0 loss: 1.5781 grad: 1.45e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.7342 data: 0.0919 lr: 1.67e-06 mem: 47% pow: 588.467 W 0: INFO 26-04-30 04:59:20.475196 - 13:24:01 - step: 48890 acc: 0 loss: 1.8263 grad: 1.47e-01 flops: 3.96e+14 wps: 4.60e+04 iter: 0.5892 data: 0.0891 lr: 1.65e-06 mem: 47% pow: 672.662 W 0: INFO 26-04-30 04:59:34.110038 - 13:24:14 - step: 48900 acc: 0 loss: 1.6424 grad: 1.49e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5951 data: 0.0903 lr: 1.64e-06 mem: 47% pow: 664.382 W 0: INFO 26-04-30 04:59:50.688908 - 13:24:31 - step: 48910 acc: 0 loss: 1.8079 grad: 1.50e-01 flops: 3.41e+14 wps: 3.96e+04 iter: 0.6186 data: 0.0947 lr: 1.62e-06 mem: 54% pow: 649.842 W 0: INFO 26-04-30 05:00:04.350200 - 13:24:45 - step: 48920 acc: 0 loss: 1.4842 grad: 1.51e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6105 data: 0.0765 lr: 1.61e-06 mem: 47% pow: 663.389 W 0: INFO 26-04-30 05:00:18.003706 - 13:24:58 - step: 48930 acc: 0 loss: 1.4479 grad: 1.48e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6075 data: 0.0821 lr: 1.59e-06 mem: 47% pow: 662.501 W 0: INFO 26-04-30 05:00:32.371474 - 13:25:13 - step: 48940 acc: 0 loss: 1.7176 grad: 1.45e-01 flops: 3.93e+14 wps: 4.56e+04 iter: 1.1136 data: 0.0762 lr: 1.58e-06 mem: 47% pow: 461.564 W 0: INFO 26-04-30 05:00:45.923351 - 13:25:26 - step: 48950 acc: 0 loss: 1.839 grad: 1.49e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5794 data: 0.0946 lr: 1.56e-06 mem: 47% pow: 669.647 W 0: INFO 26-04-30 05:00:59.470124 - 13:25:40 - step: 48960 acc: 0 loss: 1.8949 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6176 data: 0.0691 lr: 1.55e-06 mem: 47% pow: 661.66 W 0: INFO 26-04-30 05:01:13.910543 - 13:25:54 - step: 48970 acc: 0 loss: 1.5121 grad: 1.53e-01 flops: 3.91e+14 wps: 4.54e+04 iter: 0.6209 data: 0.0837 lr: 1.53e-06 mem: 47% pow: 652.026 W 0: INFO 26-04-30 05:01:27.860681 - 13:26:08 - step: 48980 acc: 0 loss: 1.6126 grad: 1.56e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.6103 data: 0.0808 lr: 1.52e-06 mem: 47% pow: 667.348 W 0: INFO 26-04-30 05:01:42.263616 - 13:26:23 - step: 48990 acc: 0 loss: 1.7152 grad: 1.46e-01 flops: 3.92e+14 wps: 4.55e+04 iter: 0.6601 data: 0.0791 lr: 1.50e-06 mem: 47% pow: 624.744 W 0: INFO 26-04-30 05:01:56.468824 - 13:26:37 - step: 49000 acc: 0 loss: 1.9196 grad: 1.49e-01 flops: 3.98e+14 wps: 4.62e+04 iter: 0.5924 data: 0.0858 lr: 1.49e-06 mem: 47% pow: 659.825 W 0: INFO 26-04-30 05:02:01.792479 - 13:26:42 - garbage collection 0: INFO 26-04-30 05:02:16.389866 - 13:26:57 - step: 49010 acc: 0 loss: 1.8162 grad: 1.42e-01 flops: 2.83e+14 wps: 3.29e+04 iter: 0.5999 data: 0.0849 lr: 1.47e-06 mem: 54% pow: 662.902 W 0: INFO 26-04-30 05:02:30.125875 - 13:27:10 - step: 49020 acc: 0 loss: 1.8334 grad: 1.48e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5836 data: 0.1106 lr: 1.46e-06 mem: 47% pow: 650.579 W 0: INFO 26-04-30 05:02:43.888024 - 13:27:24 - step: 49030 acc: 0 loss: 1.5278 grad: 1.49e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6552 data: 0.0683 lr: 1.44e-06 mem: 47% pow: 640.451 W 0: INFO 26-04-30 05:02:57.535196 - 13:27:38 - step: 49040 acc: 0 loss: 1.7664 grad: 1.44e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5904 data: 0.093 lr: 1.43e-06 mem: 47% pow: 668.12 W 0: INFO 26-04-30 05:03:11.463347 - 13:27:52 - step: 49050 acc: 0 loss: 1.5258 grad: 1.48e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.6058 data: 0.0841 lr: 1.42e-06 mem: 47% pow: 661.582 W 0: INFO 26-04-30 05:03:25.309134 - 13:28:06 - step: 49060 acc: 0 loss: 1.4132 grad: 1.43e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.6301 data: 0.085 lr: 1.40e-06 mem: 47% pow: 646.288 W 0: INFO 26-04-30 05:03:39.169518 - 13:28:19 - step: 49070 acc: 0 loss: 1.6985 grad: 1.44e-01 flops: 4.07e+14 wps: 4.73e+04 iter: 0.5812 data: 0.101 lr: 1.39e-06 mem: 47% pow: 667.298 W 0: INFO 26-04-30 05:03:53.719784 - 13:28:34 - step: 49080 acc: 0 loss: 1.441 grad: 1.46e-01 flops: 3.88e+14 wps: 4.50e+04 iter: 0.5804 data: 0.9962 lr: 1.37e-06 mem: 47% pow: 470.411 W 0: INFO 26-04-30 05:04:07.198349 - 13:28:47 - step: 49090 acc: 0 loss: 1.1238 grad: 1.49e-01 flops: 4.19e+14 wps: 4.86e+04 iter: 0.5873 data: 0.0846 lr: 1.36e-06 mem: 47% pow: 671.638 W 0: INFO 26-04-30 05:04:23.092308 - 13:29:03 - step: 49100 acc: 0 loss: 1.5673 grad: 1.43e-01 flops: 3.55e+14 wps: 4.12e+04 iter: 0.7045 data: 0.082 lr: 1.34e-06 mem: 47% pow: 604.67 W 0: INFO 26-04-30 05:04:39.997091 - 13:29:20 - step: 49110 acc: 0 loss: 1.5814 grad: 1.52e-01 flops: 3.34e+14 wps: 3.88e+04 iter: 0.6377 data: 0.0894 lr: 1.33e-06 mem: 54% pow: 640.627 W 0: INFO 26-04-30 05:04:53.643475 - 13:29:34 - step: 49120 acc: 0 loss: 1.5025 grad: 1.49e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.6105 data: 0.0883 lr: 1.31e-06 mem: 47% pow: 653.367 W 0: INFO 26-04-30 05:05:07.323216 - 13:29:48 - step: 49130 acc: 0 loss: 1.605 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5941 data: 0.086 lr: 1.30e-06 mem: 47% pow: 660.524 W 0: INFO 26-04-30 05:05:20.985975 - 13:30:01 - step: 49140 acc: 0 loss: 1.562 grad: 1.43e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6147 data: 0.0671 lr: 1.28e-06 mem: 47% pow: 659.588 W 0: INFO 26-04-30 05:05:34.382227 - 13:30:15 - step: 49150 acc: 0 loss: 1.4956 grad: 1.49e-01 flops: 4.22e+14 wps: 4.90e+04 iter: 0.6009 data: 0.0785 lr: 1.27e-06 mem: 47% pow: 685.579 W 0: INFO 26-04-30 05:05:48.375294 - 13:30:29 - step: 49160 acc: 0 loss: 1.5934 grad: 1.47e-01 flops: 4.04e+14 wps: 4.68e+04 iter: 0.6223 data: 0.0867 lr: 1.25e-06 mem: 47% pow: 644.144 W 0: INFO 26-04-30 05:06:02.230937 - 13:30:43 - step: 49170 acc: 0 loss: 1.9188 grad: 1.50e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.625 data: 0.0842 lr: 1.24e-06 mem: 47% pow: 644.858 W 0: INFO 26-04-30 05:06:15.941450 - 13:30:56 - step: 49180 acc: 0 loss: 1.3406 grad: 1.51e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.5904 data: 0.0993 lr: 1.22e-06 mem: 47% pow: 657.502 W 0: INFO 26-04-30 05:06:36.260600 - 13:31:17 - step: 49190 acc: 0 loss: 1.836 grad: 1.53e-01 flops: 2.78e+14 wps: 3.23e+04 iter: 0.7056 data: 0.0036 lr: 1.21e-06 mem: 47% pow: 648.38 W 0: INFO 26-04-30 05:06:49.770001 - 13:31:30 - step: 49200 acc: 0 loss: 1.46 grad: 1.51e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.7132 data: 0.0038 lr: 1.19e-06 mem: 47% pow: 652.276 W 0: INFO 26-04-30 05:07:06.774343 - 13:31:47 - step: 49210 acc: 0 loss: 1.7689 grad: 1.52e-01 flops: 3.32e+14 wps: 3.86e+04 iter: 0.6653 data: 0.0035 lr: 1.18e-06 mem: 54% pow: 672.497 W 0: INFO 26-04-30 05:07:20.465434 - 13:32:01 - step: 49220 acc: 0 loss: 1.114 grad: 1.51e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.6735 data: 0.0034 lr: 1.16e-06 mem: 47% pow: 665.127 W 0: INFO 26-04-30 05:07:34.185839 - 13:32:14 - step: 49230 acc: 0 loss: 1.5421 grad: 1.48e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6013 data: 0.0777 lr: 1.15e-06 mem: 47% pow: 659.212 W 0: INFO 26-04-30 05:07:48.463695 - 13:32:29 - step: 49240 acc: 0 loss: 1.3264 grad: 1.50e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.7126 data: 0.0031 lr: 1.13e-06 mem: 47% pow: 641.602 W 0: INFO 26-04-30 05:08:02.162071 - 13:32:42 - step: 49250 acc: 0 loss: 1.34 grad: 1.53e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.627 data: 0.0659 lr: 1.12e-06 mem: 47% pow: 652.14 W 0: INFO 26-04-30 05:08:15.993600 - 13:32:56 - step: 49260 acc: 0 loss: 1.7725 grad: 1.54e-01 flops: 4.08e+14 wps: 4.74e+04 iter: 0.5849 data: 0.081 lr: 1.10e-06 mem: 47% pow: 673.653 W 0: INFO 26-04-30 05:08:29.874486 - 13:33:10 - step: 49270 acc: 0 loss: 1.2566 grad: 1.54e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.598 data: 0.0891 lr: 1.09e-06 mem: 47% pow: 673.406 W 0: INFO 26-04-30 05:08:43.578023 - 13:33:24 - step: 49280 acc: 0 loss: 1.7979 grad: 1.52e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6068 data: 0.0849 lr: 1.07e-06 mem: 47% pow: 661.333 W 0: INFO 26-04-30 05:08:57.337766 - 13:33:38 - step: 49290 acc: 0 loss: 1.2148 grad: 1.49e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6032 data: 0.0845 lr: 1.06e-06 mem: 47% pow: 661.601 W 0: INFO 26-04-30 05:09:11.149750 - 13:33:51 - step: 49300 acc: 0 loss: 1.5716 grad: 1.52e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6365 data: 0.0839 lr: 1.04e-06 mem: 47% pow: 631.912 W 0: INFO 26-04-30 05:09:27.833870 - 13:34:08 - step: 49310 acc: 0 loss: 1.4466 grad: 1.49e-01 flops: 3.39e+14 wps: 3.93e+04 iter: 0.5991 data: 0.0838 lr: 1.03e-06 mem: 54% pow: 663.083 W 0: INFO 26-04-30 05:09:41.522180 - 13:34:22 - step: 49320 acc: 0 loss: 1.8916 grad: 1.52e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5906 data: 0.086 lr: 1.01e-06 mem: 47% pow: 661.987 W 0: INFO 26-04-30 05:09:55.417080 - 13:34:36 - step: 49330 acc: 0 loss: 1.8096 grad: 1.55e-01 flops: 4.06e+14 wps: 4.72e+04 iter: 0.6847 data: 0.0852 lr: 9.98e-07 mem: 47% pow: 610.981 W 0: INFO 26-04-30 05:10:09.071458 - 13:34:49 - step: 49340 acc: 0 loss: 1.3878 grad: 1.50e-01 flops: 4.14e+14 wps: 4.80e+04 iter: 0.5855 data: 0.0817 lr: 9.84e-07 mem: 47% pow: 684.539 W 0: INFO 26-04-30 05:10:22.846144 - 13:35:03 - step: 49350 acc: 0 loss: 1.513 grad: 1.51e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6133 data: 0.0834 lr: 9.69e-07 mem: 47% pow: 645.157 W 0: INFO 26-04-30 05:10:36.508136 - 13:35:17 - step: 49360 acc: 0 loss: 1.5594 grad: 1.55e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.595 data: 0.0827 lr: 9.54e-07 mem: 47% pow: 661.451 W 0: INFO 26-04-30 05:10:50.299359 - 13:35:31 - step: 49370 acc: 0 loss: 1.7113 grad: 1.51e-01 flops: 4.10e+14 wps: 4.75e+04 iter: 0.6164 data: 0.0692 lr: 9.39e-07 mem: 47% pow: 662.923 W 0: INFO 26-04-30 05:11:05.307937 - 13:35:46 - step: 49380 acc: 0 loss: 1.5626 grad: 1.51e-01 flops: 3.76e+14 wps: 4.37e+04 iter: 0.6172 data: 0.0794 lr: 9.24e-07 mem: 47% pow: 649.975 W 0: INFO 26-04-30 05:11:19.407481 - 13:36:00 - step: 49390 acc: 0 loss: 1.4684 grad: 1.48e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5939 data: 0.0842 lr: 9.09e-07 mem: 47% pow: 660.813 W 0: INFO 26-04-30 05:11:32.998357 - 13:36:13 - step: 49400 acc: 0 loss: 1.5992 grad: 1.47e-01 flops: 4.16e+14 wps: 4.82e+04 iter: 0.5991 data: 0.0876 lr: 8.94e-07 mem: 47% pow: 669.605 W 0: INFO 26-04-30 05:11:49.707768 - 13:36:30 - step: 49410 acc: 0 loss: 1.739 grad: 1.57e-01 flops: 3.38e+14 wps: 3.92e+04 iter: 0.6056 data: 0.0946 lr: 8.79e-07 mem: 54% pow: 651.139 W 0: INFO 26-04-30 05:12:03.810778 - 13:36:44 - step: 49420 acc: 0 loss: 1.5516 grad: 1.49e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.5875 data: 0.091 lr: 8.65e-07 mem: 47% pow: 658.138 W 0: INFO 26-04-30 05:12:17.419320 - 13:36:58 - step: 49430 acc: 0 loss: 1.3938 grad: 1.50e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5896 data: 0.0856 lr: 8.50e-07 mem: 47% pow: 677.955 W 0: INFO 26-04-30 05:12:31.151512 - 13:37:11 - step: 49440 acc: 0 loss: 1.2423 grad: 1.57e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5845 data: 0.1003 lr: 8.35e-07 mem: 47% pow: 663.317 W 0: INFO 26-04-30 05:12:44.841719 - 13:37:25 - step: 49450 acc: 0 loss: 1.4145 grad: 1.47e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6487 data: 0.104 lr: 8.20e-07 mem: 47% pow: 617.74 W 0: INFO 26-04-30 05:12:58.587420 - 13:37:39 - step: 49460 acc: 0 loss: 1.1893 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6119 data: 0.0751 lr: 8.05e-07 mem: 47% pow: 662.583 W 0: INFO 26-04-30 05:13:12.289618 - 13:37:53 - step: 49470 acc: 0 loss: 1.2123 grad: 1.50e-01 flops: 4.12e+14 wps: 4.79e+04 iter: 0.5904 data: 0.0896 lr: 7.90e-07 mem: 47% pow: 660.247 W 0: INFO 26-04-30 05:13:25.917539 - 13:38:06 - step: 49480 acc: 0 loss: 1.8278 grad: 1.48e-01 flops: 4.15e+14 wps: 4.81e+04 iter: 0.6103 data: 0.0773 lr: 7.75e-07 mem: 47% pow: 661.873 W 0: INFO 26-04-30 05:13:39.726320 - 13:38:20 - step: 49490 acc: 0 loss: 1.5299 grad: 1.52e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6089 data: 0.0889 lr: 7.60e-07 mem: 47% pow: 650.623 W 0: INFO 26-04-30 05:13:53.300301 - 13:38:34 - step: 49500 acc: 0 loss: 1.6767 grad: 1.51e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6119 data: 0.0788 lr: 7.45e-07 mem: 47% pow: 650.119 W 0: INFO 26-04-30 05:14:10.057379 - 13:38:50 - step: 49510 acc: 0 loss: 1.7398 grad: 1.47e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.5864 data: 0.0944 lr: 7.31e-07 mem: 54% pow: 658.603 W 0: INFO 26-04-30 05:14:23.724828 - 13:39:04 - step: 49520 acc: 0 loss: 1.5313 grad: 1.50e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6069 data: 0.0916 lr: 7.16e-07 mem: 47% pow: 645.897 W 0: INFO 26-04-30 05:14:37.610159 - 13:39:18 - step: 49530 acc: 0 loss: 1.4263 grad: 1.53e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.5868 data: 0.0928 lr: 7.01e-07 mem: 47% pow: 665.761 W 0: INFO 26-04-30 05:14:51.226359 - 13:39:32 - step: 49540 acc: 0 loss: 0.8523 grad: 1.49e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.614 data: 0.102 lr: 6.86e-07 mem: 47% pow: 635.852 W 0: INFO 26-04-30 05:15:05.301084 - 13:39:46 - step: 49550 acc: 0 loss: 1.5355 grad: 1.50e-01 flops: 4.01e+14 wps: 4.66e+04 iter: 0.5886 data: 0.0899 lr: 6.71e-07 mem: 47% pow: 667.776 W 0: INFO 26-04-30 05:15:18.981063 - 13:39:59 - step: 49560 acc: 0 loss: 1.5437 grad: 1.46e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.6048 data: 0.0795 lr: 6.56e-07 mem: 47% pow: 657.945 W 0: INFO 26-04-30 05:15:32.725047 - 13:40:13 - step: 49570 acc: 0 loss: 1.7376 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5878 data: 0.0885 lr: 6.41e-07 mem: 47% pow: 662.258 W 0: INFO 26-04-30 05:15:46.257993 - 13:40:27 - step: 49580 acc: 0 loss: 1.4791 grad: 1.48e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.6023 data: 0.0846 lr: 6.26e-07 mem: 47% pow: 658.877 W 0: INFO 26-04-30 05:15:59.931669 - 13:40:40 - step: 49590 acc: 0 loss: 1.3107 grad: 1.53e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5897 data: 0.092 lr: 6.12e-07 mem: 47% pow: 656.996 W 0: INFO 26-04-30 05:16:13.546480 - 13:40:54 - step: 49600 acc: 0 loss: 1.6182 grad: 1.46e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.7073 data: 0.0918 lr: 5.97e-07 mem: 47% pow: 592.947 W 0: INFO 26-04-30 05:16:30.297468 - 13:41:11 - step: 49610 acc: 0 loss: 1.6854 grad: 1.47e-01 flops: 3.37e+14 wps: 3.91e+04 iter: 0.5987 data: 0.087 lr: 5.82e-07 mem: 54% pow: 673.864 W 0: INFO 26-04-30 05:16:44.041988 - 13:41:24 - step: 49620 acc: 0 loss: 1.4491 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5802 data: 0.1363 lr: 5.67e-07 mem: 47% pow: 644.017 W 0: INFO 26-04-30 05:16:57.854798 - 13:41:38 - step: 49630 acc: 0 loss: 1.0478 grad: 1.50e-01 flops: 4.09e+14 wps: 4.75e+04 iter: 0.6138 data: 0.0859 lr: 5.52e-07 mem: 47% pow: 642.352 W 0: INFO 26-04-30 05:17:11.741618 - 13:41:52 - step: 49640 acc: 0 loss: 1.2544 grad: 1.48e-01 flops: 4.07e+14 wps: 4.72e+04 iter: 0.733 data: 0.0887 lr: 5.37e-07 mem: 47% pow: 586.303 W 0: INFO 26-04-30 05:17:26.018252 - 13:42:06 - step: 49650 acc: 0 loss: 1.3072 grad: 1.45e-01 flops: 3.96e+14 wps: 4.59e+04 iter: 0.5911 data: 0.0934 lr: 5.22e-07 mem: 47% pow: 672.051 W 0: INFO 26-04-30 05:17:39.789815 - 13:42:20 - step: 49660 acc: 0 loss: 1.4165 grad: 1.47e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.5927 data: 0.0865 lr: 5.07e-07 mem: 47% pow: 665.738 W 0: INFO 26-04-30 05:17:53.467081 - 13:42:34 - step: 49670 acc: 0 loss: 1.3672 grad: 1.61e-01 flops: 4.13e+14 wps: 4.79e+04 iter: 0.5804 data: 0.1768 lr: 4.93e-07 mem: 47% pow: 620.196 W 0: INFO 26-04-30 05:18:07.051282 - 13:42:47 - step: 49680 acc: 0 loss: 1.4447 grad: 1.54e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.61 data: 0.093 lr: 4.78e-07 mem: 47% pow: 650.738 W 0: INFO 26-04-30 05:18:20.448040 - 13:43:01 - step: 49690 acc: 0 loss: 1.0368 grad: 1.50e-01 flops: 4.22e+14 wps: 4.89e+04 iter: 0.5908 data: 0.0898 lr: 4.63e-07 mem: 47% pow: 659.12 W 0: INFO 26-04-30 05:18:33.890942 - 13:43:14 - step: 49700 acc: 0 loss: 1.3329 grad: 1.51e-01 flops: 4.20e+14 wps: 4.88e+04 iter: 0.5946 data: 0.0848 lr: 4.48e-07 mem: 47% pow: 669.945 W 0: INFO 26-04-30 05:18:50.886745 - 13:43:31 - step: 49710 acc: 0 loss: 1.4453 grad: 1.54e-01 flops: 3.32e+14 wps: 3.86e+04 iter: 0.7358 data: 0.0796 lr: 4.33e-07 mem: 54% pow: 580.52 W 0: INFO 26-04-30 05:19:04.489338 - 13:43:45 - step: 49720 acc: 0 loss: 1.7858 grad: 1.55e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5821 data: 0.0954 lr: 4.18e-07 mem: 47% pow: 665.913 W 0: INFO 26-04-30 05:19:19.291392 - 13:44:00 - step: 49730 acc: 0 loss: 1.7604 grad: 1.59e-01 flops: 3.82e+14 wps: 4.43e+04 iter: 0.6281 data: 0.1254 lr: 4.03e-07 mem: 47% pow: 619.717 W 0: INFO 26-04-30 05:19:32.874250 - 13:44:13 - step: 49740 acc: 0 loss: 1.5395 grad: 1.61e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.601 data: 0.0839 lr: 3.88e-07 mem: 47% pow: 659.452 W 0: INFO 26-04-30 05:19:46.807597 - 13:44:27 - step: 49750 acc: 0 loss: 1.2032 grad: 1.49e-01 flops: 4.05e+14 wps: 4.70e+04 iter: 0.788 data: 0.0901 lr: 3.73e-07 mem: 47% pow: 555.034 W 0: INFO 26-04-30 05:20:00.563589 - 13:44:41 - step: 49760 acc: 0 loss: 1.6573 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5782 data: 0.1371 lr: 3.59e-07 mem: 47% pow: 646.904 W 0: INFO 26-04-30 05:20:14.177245 - 13:44:54 - step: 49770 acc: 0 loss: 1.2288 grad: 1.52e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.6252 data: 0.0774 lr: 3.44e-07 mem: 47% pow: 649.204 W 0: INFO 26-04-30 05:20:28.336763 - 13:45:09 - step: 49780 acc: 0 loss: 1.6063 grad: 1.60e-01 flops: 3.99e+14 wps: 4.63e+04 iter: 0.5991 data: 0.0896 lr: 3.29e-07 mem: 47% pow: 657.144 W 0: INFO 26-04-30 05:20:41.765341 - 13:45:22 - step: 49790 acc: 0 loss: 1.5097 grad: 1.54e-01 flops: 4.21e+14 wps: 4.88e+04 iter: 0.5962 data: 0.0938 lr: 3.14e-07 mem: 47% pow: 663.13 W 0: INFO 26-04-30 05:20:55.402998 - 13:45:36 - step: 49800 acc: 0 loss: 1.2333 grad: 1.55e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5952 data: 0.0888 lr: 2.99e-07 mem: 47% pow: 666.606 W 0: INFO 26-04-30 05:21:11.813598 - 13:45:52 - step: 49810 acc: 0 loss: 1.3873 grad: 1.52e-01 flops: 3.44e+14 wps: 4.00e+04 iter: 0.5892 data: 0.0904 lr: 2.84e-07 mem: 54% pow: 653.583 W 0: INFO 26-04-30 05:21:25.567952 - 13:46:06 - step: 49820 acc: 0 loss: 1.3635 grad: 1.52e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5898 data: 0.0962 lr: 2.69e-07 mem: 47% pow: 665.163 W 0: INFO 26-04-30 05:21:39.074650 - 13:46:19 - step: 49830 acc: 0 loss: 1.616 grad: 1.49e-01 flops: 4.18e+14 wps: 4.85e+04 iter: 0.5986 data: 0.0886 lr: 2.54e-07 mem: 47% pow: 662.456 W 0: INFO 26-04-30 05:21:52.744322 - 13:46:33 - step: 49840 acc: 0 loss: 1.9206 grad: 1.58e-01 flops: 4.13e+14 wps: 4.80e+04 iter: 0.6043 data: 0.0879 lr: 2.40e-07 mem: 47% pow: 660.151 W 0: INFO 26-04-30 05:22:06.058499 - 13:46:46 - step: 49850 acc: 0 loss: 1.6654 grad: 1.53e-01 flops: 4.24e+14 wps: 4.92e+04 iter: 0.5869 data: 0.0863 lr: 2.25e-07 mem: 47% pow: 678.083 W 0: INFO 26-04-30 05:22:19.767862 - 13:47:00 - step: 49860 acc: 0 loss: 1.4412 grad: 1.51e-01 flops: 4.12e+14 wps: 4.78e+04 iter: 0.6051 data: 0.0866 lr: 2.10e-07 mem: 47% pow: 652.061 W 0: INFO 26-04-30 05:22:33.852185 - 13:47:14 - step: 49870 acc: 0 loss: 1.4809 grad: 1.53e-01 flops: 4.01e+14 wps: 4.65e+04 iter: 0.6139 data: 0.0882 lr: 1.95e-07 mem: 47% pow: 659.987 W 0: INFO 26-04-30 05:22:47.405514 - 13:47:28 - step: 49880 acc: 0 loss: 2.1725 grad: 1.54e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5974 data: 0.093 lr: 1.80e-07 mem: 47% pow: 659.64 W 0: INFO 26-04-30 05:23:01.169570 - 13:47:41 - step: 49890 acc: 0 loss: 1.5235 grad: 1.51e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.6179 data: 0.0912 lr: 1.65e-07 mem: 47% pow: 652.717 W 0: INFO 26-04-30 05:23:14.727751 - 13:47:55 - step: 49900 acc: 0 loss: 1.2541 grad: 1.53e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.586 data: 0.0908 lr: 1.50e-07 mem: 47% pow: 663.686 W 0: INFO 26-04-30 05:23:31.472531 - 13:48:12 - step: 49910 acc: 0 loss: 1.4107 grad: 1.48e-01 flops: 3.37e+14 wps: 3.92e+04 iter: 0.6047 data: 0.0832 lr: 1.35e-07 mem: 54% pow: 658.881 W 0: INFO 26-04-30 05:23:45.106153 - 13:48:25 - step: 49920 acc: 0 loss: 1.5942 grad: 1.47e-01 flops: 4.14e+14 wps: 4.81e+04 iter: 0.5925 data: 0.0813 lr: 1.21e-07 mem: 47% pow: 662.408 W 0: INFO 26-04-30 05:23:58.705496 - 13:48:39 - step: 49930 acc: 0 loss: 1.432 grad: 1.53e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5857 data: 0.0867 lr: 1.06e-07 mem: 47% pow: 668.855 W 0: INFO 26-04-30 05:24:12.275348 - 13:48:53 - step: 49940 acc: 0 loss: 1.3482 grad: 1.53e-01 flops: 4.16e+14 wps: 4.83e+04 iter: 0.6004 data: 0.0849 lr: 9.08e-08 mem: 47% pow: 660.501 W 0: INFO 26-04-30 05:24:25.810931 - 13:49:06 - step: 49950 acc: 0 loss: 1.6936 grad: 1.50e-01 flops: 4.17e+14 wps: 4.84e+04 iter: 0.5785 data: 0.0963 lr: 7.59e-08 mem: 47% pow: 666.286 W 0: INFO 26-04-30 05:24:39.539481 - 13:49:20 - step: 49960 acc: 0 loss: 1.7351 grad: 1.53e-01 flops: 4.11e+14 wps: 4.77e+04 iter: 0.5834 data: 0.1052 lr: 6.10e-08 mem: 47% pow: 662.921 W 0: INFO 26-04-30 05:24:53.142978 - 13:49:33 - step: 49970 acc: 0 loss: 1.824 grad: 1.50e-01 flops: 4.15e+14 wps: 4.82e+04 iter: 0.5951 data: 0.0897 lr: 4.61e-08 mem: 47% pow: 663.228 W 0: INFO 26-04-30 05:25:07.056804 - 13:49:47 - step: 49980 acc: 0 loss: 1.6036 grad: 1.50e-01 flops: 4.06e+14 wps: 4.71e+04 iter: 0.5778 data: 0.0977 lr: 3.12e-08 mem: 47% pow: 685.858 W 0: INFO 26-04-30 05:25:20.405625 - 13:50:01 - step: 49990 acc: 0 loss: 1.2225 grad: 1.63e-01 flops: 4.23e+14 wps: 4.91e+04 iter: 0.5938 data: 0.0905 lr: 1.64e-08 mem: 47% pow: 661.752 W 0: INFO 26-04-30 05:25:34.181136 - 13:50:14 - step: 50000 acc: 0 loss: 1.3688 grad: 1.46e-01 flops: 4.10e+14 wps: 4.76e+04 iter: 0.6719 data: 0.0866 lr: 1.49e-09 mem: 47% pow: 609.672 W 0: INFO 26-04-30 05:25:34.185899 - 13:50:14 - Saving to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000050000 0: INFO 26-04-30 05:25:34.186444 - 13:50:14 - Saving... 0: INFO 26-04-30 05:25:40.196909 - 13:50:20 - State dict saved! 0: INFO 26-04-30 05:25:40.316134 - 13:50:21 - Saving train state to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000050000/train_state_00000.json 0: INFO 26-04-30 05:25:40.395231 - 13:50:21 - Train state saved ! 0: INFO 26-04-30 05:25:40.398738 - 13:50:21 - Cleaning up checkpoints... 0: INFO 26-04-30 05:25:40.399370 - 13:50:21 - Dump folders: [PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000045000'), PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000050000')] 0: INFO 26-04-30 05:25:40.399748 - 13:50:21 - Eval folders: [] 0: INFO 26-04-30 05:25:40.400097 - 13:50:21 - Other folders: [] 0: INFO 26-04-30 05:25:40.400305 - 13:50:21 - Removing folders: {PosixPath('/home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000045000')} 0: DEBUG 26-04-30 05:25:41.107715 - 13:50:21 - PyTorch version 2.8.0 available. 0: INFO 26-04-30 05:25:42.910361 - 13:50:23 - Consolidating to: /home/xun/rsadhukh/STEM/logs/midfine_base_final/checkpoints/0000050000/consolidated 0: INFO 26-04-30 05:26:29.420748 - 13:51:10 - Consolidated ! 0: INFO 26-04-30 05:26:29.437254 - 13:51:10 - Loading model (type=olmo3) 0: INFO 26-04-30 05:26:30.050010 - 13:51:10 - Using vocab_size=100352 from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/config.json (tokenizer has 100278 tokens) 0: INFO 26-04-30 05:26:30.051431 - 13:51:10 - HuggingFace tokenizer loaded from /data/rsadhukh/checkpoints/olmo2-1b-base-token4T/ – #words: 100352, BOS ID: 100257, EOS ID: 100257 0: INFO 26-04-30 05:26:54.981421 - 13:51:35 - Model loaded 0: DEBUG 26-04-30 05:27:27.563324 - 13:52:08 - Attempting to acquire lock 23106620490768 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_hellaswag_default_0.0.0_1b5e44df7eeeac25.lock 0: DEBUG 26-04-30 05:27:27.571896 - 13:52:08 - Lock 23106620490768 not acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_hellaswag_default_0.0.0_1b5e44df7eeeac25.lock, waiting 0.05 seconds ... 0: DEBUG 26-04-30 05:27:27.622314 - 13:52:08 - Attempting to acquire lock 23106620490768 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_hellaswag_default_0.0.0_1b5e44df7eeeac25.lock 0: DEBUG 26-04-30 05:27:27.627657 - 13:52:08 - Lock 23106620490768 acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_hellaswag_default_0.0.0_1b5e44df7eeeac25.lock 0: DEBUG 26-04-30 05:27:27.631410 - 13:52:08 - open file: /home/xun/.cache/huggingface/datasets/hellaswag/default/0.0.0/1b5e44df7eeeac25/dataset_info.json 0: DEBUG 26-04-30 05:27:27.632859 - 13:52:08 - Attempting to release lock 23106620490768 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_hellaswag_default_0.0.0_1b5e44df7eeeac25.lock 0: DEBUG 26-04-30 05:27:27.638481 - 13:52:08 - Lock 23106620490768 released on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_hellaswag_default_0.0.0_1b5e44df7eeeac25.lock 0: DEBUG 26-04-30 05:27:27.709968 - 13:52:08 - Attempting to acquire lock 23106625915472 on /home/xun/.cache/huggingface/datasets/hellaswag/default/0.0.0/1b5e44df7eeeac25_builder.lock 0: DEBUG 26-04-30 05:27:27.714318 - 13:52:08 - Lock 23106625915472 not acquired on /home/xun/.cache/huggingface/datasets/hellaswag/default/0.0.0/1b5e44df7eeeac25_builder.lock, waiting 0.05 seconds ... 0: DEBUG 26-04-30 05:27:27.764784 - 13:52:08 - Attempting to acquire lock 23106625915472 on /home/xun/.cache/huggingface/datasets/hellaswag/default/0.0.0/1b5e44df7eeeac25_builder.lock 0: DEBUG 26-04-30 05:27:27.768637 - 13:52:08 - Lock 23106625915472 acquired on /home/xun/.cache/huggingface/datasets/hellaswag/default/0.0.0/1b5e44df7eeeac25_builder.lock 0: DEBUG 26-04-30 05:27:27.769501 - 13:52:08 - open file: /home/xun/.cache/huggingface/datasets/hellaswag/default/0.0.0/1b5e44df7eeeac25/dataset_info.json 0: DEBUG 26-04-30 05:27:27.770713 - 13:52:08 - Attempting to release lock 23106625915472 on /home/xun/.cache/huggingface/datasets/hellaswag/default/0.0.0/1b5e44df7eeeac25_builder.lock 0: DEBUG 26-04-30 05:27:27.774507 - 13:52:08 - Lock 23106625915472 released on /home/xun/.cache/huggingface/datasets/hellaswag/default/0.0.0/1b5e44df7eeeac25_builder.lock 0: DEBUG 26-04-30 05:27:30.895107 - 13:52:11 - Attempting to acquire lock 23106386125968 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_super_glue_boolq_0.0.0_a29da19d1bb560f5.lock 0: DEBUG 26-04-30 05:27:30.900839 - 13:52:11 - Lock 23106386125968 acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_super_glue_boolq_0.0.0_a29da19d1bb560f5.lock 0: DEBUG 26-04-30 05:27:30.904434 - 13:52:11 - open file: /home/xun/.cache/huggingface/datasets/super_glue/boolq/0.0.0/a29da19d1bb560f5/dataset_info.json 0: DEBUG 26-04-30 05:27:30.905274 - 13:52:11 - Attempting to release lock 23106386125968 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_super_glue_boolq_0.0.0_a29da19d1bb560f5.lock 0: DEBUG 26-04-30 05:27:30.908928 - 13:52:11 - Lock 23106386125968 released on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_super_glue_boolq_0.0.0_a29da19d1bb560f5.lock 0: DEBUG 26-04-30 05:27:30.915272 - 13:52:11 - Attempting to acquire lock 23106630388368 on /home/xun/.cache/huggingface/datasets/super_glue/boolq/0.0.0/a29da19d1bb560f5_builder.lock 0: DEBUG 26-04-30 05:27:30.919646 - 13:52:11 - Lock 23106630388368 acquired on /home/xun/.cache/huggingface/datasets/super_glue/boolq/0.0.0/a29da19d1bb560f5_builder.lock 0: DEBUG 26-04-30 05:27:30.920452 - 13:52:11 - open file: /home/xun/.cache/huggingface/datasets/super_glue/boolq/0.0.0/a29da19d1bb560f5/dataset_info.json 0: DEBUG 26-04-30 05:27:30.921595 - 13:52:11 - Attempting to release lock 23106630388368 on /home/xun/.cache/huggingface/datasets/super_glue/boolq/0.0.0/a29da19d1bb560f5_builder.lock 0: DEBUG 26-04-30 05:27:30.925475 - 13:52:11 - Lock 23106630388368 released on /home/xun/.cache/huggingface/datasets/super_glue/boolq/0.0.0/a29da19d1bb560f5_builder.lock 0: DEBUG 26-04-30 05:27:31.408914 - 13:52:12 - Attempting to acquire lock 23090440323984 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_piqa_default_0.0.0_ad12f21308541b01.lock 0: DEBUG 26-04-30 05:27:31.413463 - 13:52:12 - Lock 23090440323984 not acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_piqa_default_0.0.0_ad12f21308541b01.lock, waiting 0.05 seconds ... 0: DEBUG 26-04-30 05:27:31.463881 - 13:52:12 - Attempting to acquire lock 23090440323984 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_piqa_default_0.0.0_ad12f21308541b01.lock 0: DEBUG 26-04-30 05:27:31.469047 - 13:52:12 - Lock 23090440323984 acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_piqa_default_0.0.0_ad12f21308541b01.lock 0: DEBUG 26-04-30 05:27:31.469774 - 13:52:12 - open file: /home/xun/.cache/huggingface/datasets/piqa/default/0.0.0/ad12f21308541b01/dataset_info.json 0: DEBUG 26-04-30 05:27:31.470564 - 13:52:12 - Attempting to release lock 23090440323984 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_piqa_default_0.0.0_ad12f21308541b01.lock 0: DEBUG 26-04-30 05:27:31.476204 - 13:52:12 - Lock 23090440323984 released on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_piqa_default_0.0.0_ad12f21308541b01.lock 0: DEBUG 26-04-30 05:27:31.479639 - 13:52:12 - Attempting to acquire lock 23090694007184 on /home/xun/.cache/huggingface/datasets/piqa/default/0.0.0/ad12f21308541b01_builder.lock 0: DEBUG 26-04-30 05:27:31.483219 - 13:52:12 - Lock 23090694007184 acquired on /home/xun/.cache/huggingface/datasets/piqa/default/0.0.0/ad12f21308541b01_builder.lock 0: DEBUG 26-04-30 05:27:31.483745 - 13:52:12 - open file: /home/xun/.cache/huggingface/datasets/piqa/default/0.0.0/ad12f21308541b01/dataset_info.json 0: DEBUG 26-04-30 05:27:31.484776 - 13:52:12 - Attempting to release lock 23090694007184 on /home/xun/.cache/huggingface/datasets/piqa/default/0.0.0/ad12f21308541b01_builder.lock 0: DEBUG 26-04-30 05:27:31.488256 - 13:52:12 - Lock 23090694007184 released on /home/xun/.cache/huggingface/datasets/piqa/default/0.0.0/ad12f21308541b01_builder.lock 0: DEBUG 26-04-30 05:27:31.907803 - 13:52:12 - Attempting to acquire lock 23106630395408 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_winogrande_winogrande_xl_0.0.0_18c0f92b2399136c.lock 0: DEBUG 26-04-30 05:27:31.912252 - 13:52:12 - Lock 23106630395408 not acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_winogrande_winogrande_xl_0.0.0_18c0f92b2399136c.lock, waiting 0.05 seconds ... 0: DEBUG 26-04-30 05:27:31.962541 - 13:52:12 - Attempting to acquire lock 23106630395408 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_winogrande_winogrande_xl_0.0.0_18c0f92b2399136c.lock 0: DEBUG 26-04-30 05:27:31.967334 - 13:52:12 - Lock 23106630395408 acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_winogrande_winogrande_xl_0.0.0_18c0f92b2399136c.lock 0: DEBUG 26-04-30 05:27:31.968597 - 13:52:12 - open file: /home/xun/.cache/huggingface/datasets/winogrande/winogrande_xl/0.0.0/18c0f92b2399136c/dataset_info.json 0: DEBUG 26-04-30 05:27:31.969579 - 13:52:12 - Attempting to release lock 23106630395408 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_winogrande_winogrande_xl_0.0.0_18c0f92b2399136c.lock 0: DEBUG 26-04-30 05:27:31.974716 - 13:52:12 - Lock 23106630395408 released on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_winogrande_winogrande_xl_0.0.0_18c0f92b2399136c.lock 0: DEBUG 26-04-30 05:27:31.978514 - 13:52:12 - Attempting to acquire lock 23090694002704 on /home/xun/.cache/huggingface/datasets/winogrande/winogrande_xl/0.0.0/18c0f92b2399136c_builder.lock 0: DEBUG 26-04-30 05:27:31.982959 - 13:52:12 - Lock 23090694002704 acquired on /home/xun/.cache/huggingface/datasets/winogrande/winogrande_xl/0.0.0/18c0f92b2399136c_builder.lock 0: DEBUG 26-04-30 05:27:31.983329 - 13:52:12 - open file: /home/xun/.cache/huggingface/datasets/winogrande/winogrande_xl/0.0.0/18c0f92b2399136c/dataset_info.json 0: DEBUG 26-04-30 05:27:31.984194 - 13:52:12 - Attempting to release lock 23090694002704 on /home/xun/.cache/huggingface/datasets/winogrande/winogrande_xl/0.0.0/18c0f92b2399136c_builder.lock 0: DEBUG 26-04-30 05:27:31.987548 - 13:52:12 - Lock 23090694002704 released on /home/xun/.cache/huggingface/datasets/winogrande/winogrande_xl/0.0.0/18c0f92b2399136c_builder.lock 0: DEBUG 26-04-30 05:27:32.911877 - 13:52:13 - Attempting to acquire lock 23106619172624 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_openbookqa_main_0.0.0_d5f895b4f0a071fc.lock 0: DEBUG 26-04-30 05:27:32.914523 - 13:52:13 - Lock 23106619172624 not acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_openbookqa_main_0.0.0_d5f895b4f0a071fc.lock, waiting 0.05 seconds ... 0: DEBUG 26-04-30 05:27:32.964931 - 13:52:13 - Attempting to acquire lock 23106619172624 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_openbookqa_main_0.0.0_d5f895b4f0a071fc.lock 0: DEBUG 26-04-30 05:27:32.969395 - 13:52:13 - Lock 23106619172624 acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_openbookqa_main_0.0.0_d5f895b4f0a071fc.lock 0: DEBUG 26-04-30 05:27:32.970185 - 13:52:13 - open file: /home/xun/.cache/huggingface/datasets/openbookqa/main/0.0.0/d5f895b4f0a071fc/dataset_info.json 0: DEBUG 26-04-30 05:27:32.971027 - 13:52:13 - Attempting to release lock 23106619172624 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_openbookqa_main_0.0.0_d5f895b4f0a071fc.lock 0: DEBUG 26-04-30 05:27:32.974893 - 13:52:13 - Lock 23106619172624 released on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_openbookqa_main_0.0.0_d5f895b4f0a071fc.lock 0: DEBUG 26-04-30 05:27:32.977556 - 13:52:13 - Attempting to acquire lock 23090599459920 on /home/xun/.cache/huggingface/datasets/openbookqa/main/0.0.0/d5f895b4f0a071fc_builder.lock 0: DEBUG 26-04-30 05:27:32.981396 - 13:52:13 - Lock 23090599459920 acquired on /home/xun/.cache/huggingface/datasets/openbookqa/main/0.0.0/d5f895b4f0a071fc_builder.lock 0: DEBUG 26-04-30 05:27:32.981987 - 13:52:13 - open file: /home/xun/.cache/huggingface/datasets/openbookqa/main/0.0.0/d5f895b4f0a071fc/dataset_info.json 0: DEBUG 26-04-30 05:27:32.982935 - 13:52:13 - Attempting to release lock 23090599459920 on /home/xun/.cache/huggingface/datasets/openbookqa/main/0.0.0/d5f895b4f0a071fc_builder.lock 0: DEBUG 26-04-30 05:27:32.987277 - 13:52:13 - Lock 23090599459920 released on /home/xun/.cache/huggingface/datasets/openbookqa/main/0.0.0/d5f895b4f0a071fc_builder.lock 0: DEBUG 26-04-30 05:27:33.186566 - 13:52:13 - Attempting to acquire lock 23090568443344 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_ai2_arc_ARC-Easy_0.0.0_55eda3b29fc4b7ed.lock 0: DEBUG 26-04-30 05:27:33.192044 - 13:52:13 - Lock 23090568443344 acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_ai2_arc_ARC-Easy_0.0.0_55eda3b29fc4b7ed.lock 0: DEBUG 26-04-30 05:27:33.192824 - 13:52:13 - open file: /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Easy/0.0.0/55eda3b29fc4b7ed/dataset_info.json 0: DEBUG 26-04-30 05:27:33.193676 - 13:52:13 - Attempting to release lock 23090568443344 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_ai2_arc_ARC-Easy_0.0.0_55eda3b29fc4b7ed.lock 0: DEBUG 26-04-30 05:27:33.198403 - 13:52:13 - Lock 23090568443344 released on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_ai2_arc_ARC-Easy_0.0.0_55eda3b29fc4b7ed.lock 0: DEBUG 26-04-30 05:27:33.200721 - 13:52:13 - Attempting to acquire lock 23090568428176 on /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Easy/0.0.0/55eda3b29fc4b7ed_builder.lock 0: DEBUG 26-04-30 05:27:33.204488 - 13:52:14 - Lock 23090568428176 acquired on /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Easy/0.0.0/55eda3b29fc4b7ed_builder.lock 0: DEBUG 26-04-30 05:27:33.205319 - 13:52:14 - open file: /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Easy/0.0.0/55eda3b29fc4b7ed/dataset_info.json 0: DEBUG 26-04-30 05:27:33.206000 - 13:52:14 - Attempting to release lock 23090568428176 on /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Easy/0.0.0/55eda3b29fc4b7ed_builder.lock 0: DEBUG 26-04-30 05:27:33.208991 - 13:52:14 - Lock 23090568428176 released on /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Easy/0.0.0/55eda3b29fc4b7ed_builder.lock 0: DEBUG 26-04-30 05:27:33.330889 - 13:52:14 - Attempting to acquire lock 23090568431376 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_ai2_arc_ARC-Challenge_0.0.0_55eda3b29fc4b7ed.lock 0: DEBUG 26-04-30 05:27:33.335011 - 13:52:14 - Lock 23090568431376 acquired on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_ai2_arc_ARC-Challenge_0.0.0_55eda3b29fc4b7ed.lock 0: DEBUG 26-04-30 05:27:33.339352 - 13:52:14 - open file: /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Challenge/0.0.0/55eda3b29fc4b7ed/dataset_info.json 0: DEBUG 26-04-30 05:27:33.342280 - 13:52:14 - Attempting to release lock 23090568431376 on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_ai2_arc_ARC-Challenge_0.0.0_55eda3b29fc4b7ed.lock 0: DEBUG 26-04-30 05:27:33.346803 - 13:52:14 - Lock 23090568431376 released on /home/xun/.cache/huggingface/datasets/_home_xun_.cache_huggingface_datasets_ai2_arc_ARC-Challenge_0.0.0_55eda3b29fc4b7ed.lock 0: DEBUG 26-04-30 05:27:33.350687 - 13:52:14 - Attempting to acquire lock 23090614595792 on /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Challenge/0.0.0/55eda3b29fc4b7ed_builder.lock 0: DEBUG 26-04-30 05:27:33.354884 - 13:52:14 - Lock 23090614595792 acquired on /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Challenge/0.0.0/55eda3b29fc4b7ed_builder.lock 0: DEBUG 26-04-30 05:27:33.355223 - 13:52:14 - open file: /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Challenge/0.0.0/55eda3b29fc4b7ed/dataset_info.json 0: DEBUG 26-04-30 05:27:33.355975 - 13:52:14 - Attempting to release lock 23090614595792 on /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Challenge/0.0.0/55eda3b29fc4b7ed_builder.lock 0: DEBUG 26-04-30 05:27:33.359656 - 13:52:14 - Lock 23090614595792 released on /home/xun/.cache/huggingface/datasets/ai2_arc/ARC-Challenge/0.0.0/55eda3b29fc4b7ed_builder.lock 0: INFO 26-04-30 05:27:56.627830 - 13:52:37 - All evaluation results: {'arc_challenge': {'alias': 'arc_challenge', 'acc,none': 0.42235494880546076, 'acc_stderr,none': 0.014434138713379983, 'acc_norm,none': 0.45051194539249145, 'acc_norm_stderr,none': 0.014539646098471627}, 'arc_easy': {'alias': 'arc_easy', 'acc,none': 0.7563131313131313, 'acc_stderr,none': 0.00880917174472056, 'acc_norm,none': 0.7567340067340067, 'acc_norm_stderr,none': 0.00880400984686553}, 'boolq': {'alias': 'boolq', 'acc,none': 0.6938837920489297, 'acc_stderr,none': 0.008060817222724517}, 'hellaswag': {'alias': 'hellaswag', 'acc,none': 0.4953196574387572, 'acc_stderr,none': 0.004989562798280521, 'acc_norm,none': 0.6694881497709619, 'acc_norm_stderr,none': 0.00469436096892941}, 'openbookqa': {'alias': 'openbookqa', 'acc,none': 0.272, 'acc_stderr,none': 0.019920483209566072, 'acc_norm,none': 0.396, 'acc_norm_stderr,none': 0.021893529941665813}, 'piqa': {'alias': 'piqa', 'acc,none': 0.7486398258977149, 'acc_stderr,none': 0.010121156016819262, 'acc_norm,none': 0.7464635473340587, 'acc_norm_stderr,none': 0.010150090834551784}, 'winogrande': {'alias': 'winogrande', 'acc,none': 0.665351223362273, 'acc_stderr,none': 0.013261823629558363}} 0: INFO 26-04-30 05:27:56.628243 - 13:52:37 - Writing metric logs to /home/xun/rsadhukh/STEM/logs/midfine_base_final/metrics.eval.jsonl 0: INFO 26-04-30 05:27:56.632908 - 13:52:37 - Logged 24 eval metrics to wandb at step 50000